
    !}gf                         d dl mZmZmZmZ d dl mZmZ d dlmZ d dl	Z	d dl
Z
 ed          Z e
j        d          Z G d de          Zed	ed
fdZdS )    )RegexAnalyzerLowercaseFilter
StopFilter
StemFilter)	TokenizerToken)stemN)%aanandareasatbebycanforfromhaveifinisitmaynotofonortbdthatthethistouswewhenwillwithyetyouyouru   的u   了u   和z[\u4E00-\u9FA5]+c                       e Zd Zd ZdS )ChineseTokenizerc              +     K   t          j        |d          }t                      }|D ][\  }}}t                              |          st          |          dk    r4|x|_        |_        ||_        ||_	        ||_
        |V  \d S )Nsearch)mode   )jiebatokenizer   accepted_charsmatchlenoriginaltextpos	startcharendchar)selfr8   kargswordstokenw	start_posstop_poss           V/var/www/py-google-trends/myenv/lib/python3.11/site-packages/jieba/analyse/analyzer.py__call__zChineseTokenizer.__call__   s      t(333&+ 	 	"Qy!''** s1vvqyy*++ENUZ!EI'EO$EMKKKK	 	    N)__name__
__module____qualname__rD    rE   rC   r-   r-      s#        
 
 
 
 
rE   r-   r1   iP  c                     t                      t                      z  t          | |          z  t          |d |          z  S )N)stoplistminsize)stemfnignore	cachesize)r-   r   r   r   )rK   rL   rM   rO   s       rC   ChineseAnalyzerrP      sI    !2!22999:fTIFFFG HrE   )whoosh.analysisr   r   r   r   r   r   whoosh.lang.porterr	   r2   re	frozenset
STOP_WORDScompiler4   r-   rP   rI   rE   rC   <module>rW      s    O O O O O O O O O O O O + + + + + + + + # # # # # #  				Y < = =
 /00    y    (45 H H H H H HrE   