
    ^i]                     Z    d dl mZ d dlmZ d dlmZmZ d dlmZm	Z	 d dl
mZ d Zd Zd Zy	)
    )unicode_literals)chain)	text_type
bytes_type)RE_HANSPHRASES_DICT)mmsegc                    t        |       } g }| D ]x  }t        j                  |      s|j                  |       *t        r8|j                  t        t        j                  j                  |                   h|j                  |       z |S )N)

simple_segr   matchappendr   extendlistr	   segcut)hansretxs      R/mnt/e/genesis-system/.venv/lib/python3.12/site-packages/pypinyin/seg/simpleseg.pyr   r      sj    dD
C }}QJJqMJJtEIIMM!,-.JJqM J    c           
         t        | t              rJ d       t        | t              rt        |       S t	        |       } t        |       dk(  rt        | d         S t	        t        | D cg c]  }t        |       c}       S c c}w )u0   将传入的字符串按是否是汉字来分割z-must be unicode string or [unicode, ...] list   r   )
isinstancer   r   _segr   lenr   r   )r   r   s     r   r   r      sw    $
+ 878+ $	"DzDzt9>d1g&&E48aJqM89::8s   (Bc                 "   d}g }d}t        |       D ]i  \  }}t        j                  |      r(|dk(  rd}|dk(  r||z  }-|j                  |       d}|}C|dk(  rd}|dk(  r||z  }U|j                  |       d}|}k |j                  |       |S )u   按是否是汉字进行分词 r   r   )	enumerater   r   r   )charssr   flagncs         r   r   r   &   s    
A
CD%  1==AvqyQ

1 AvqyQ

1+. JJqMJr   N)
__future__r   	itertoolsr   pypinyin.compatr   r   pypinyin.constantsr   r   pypinyin.segr	   r   r   r    r   r   <module>r*      s#    '  1 4 
;r   