
    Ng2                        d dl Z d dlmZ d dlmZ d dlmZ  eddg          Z e j        e           e j	                    d	                         Z
e
                    d
           e j        dddd           e j        ddddd           e j        dddd           e j        dddd           e j        dddd          d                                                                          ZdS )!    N)tqdm)word_tokenize)parallelize_preprocessz-hz--help)help_option_names)context_settingsc                      d S )N r	       D/var/www/html/ai-engine/env/lib/python3.11/site-packages/nltk/cli.pyclir      s	     	Dr
   tokenizez
--languagez-lenz1The language for the Punkt sentence tokenization.)defaulthelpz--preserve-lineTzIAn option to keep the preserve the sentence and not sentence tokenize it.)r   is_flagr   z--processesz-j   zNo. of processes.z
--encodingz-eutf8zSpecify encoding of file.z--delimiterz-d z%Specify delimiter to join the tokens.c           
         t          j        d|          5 }t          j        d|          5 }|dk    rWt          |                                          D ]4}t	          |                    t          |                    d|           5nRt          t          |                                |d          D ]'}t	          |                    |          d|           (d	d	d	           n# 1 swxY w Y   d	d	d	           d	S # 1 swxY w Y   d	S )
z;This command tokenizes text stream using nltk.word_tokenizestdin)encodingstdoutr   
)endfileT)progress_barN)clickget_text_streamr   	readlinesprintjoinr   r   )	languagepreserve_line	processesr   	delimiterfinfoutlineoutlines	            r   tokenize_filer*      s   * 
	w	:	:	: Hc"8h??? 
	H4 A~~ 11 T TD)..t)<)<==4dSSSSST  6!3==??ID      H HG )..11t$GGGGG
	H 
	H 
	H 
	H 
	H 
	H 
	H 
	H 
	H 
	H 
	H 
	H 
	H 
	H 
	HH H H H H H H H H H H H H H H H H Hs5   DB0C*D*C.	.D1C.	2DD	D)r   r   nltkr   	nltk.utilr   dictCONTEXT_SETTINGSgroupversion_optionr   commandoptionr*   r	   r
   r   <module>r3      s                , , , , , ,44*:;;;  .///	 	  0/	 Z	<	   	T   mT13FGGGlD&7RSSS4+R  H H  TS HG   &H H Hr
   