
    j%                        d dl mZmZmZ d dlZd dlmZmZ  ej                    d             Z	e	
                                 ej        ded           ej        ded	           ej        d
edd           ej        dedd           ej        dedd           ej        ded           ej        deeefddd           ej        ddddd          	 	 	 d,deded ed!eeeef         d"ed#eee                  d$eee                  d%ee         fd&                                                                                                            Ze	
                                 ej        ded           ej        ded'           ej        d
edd(           ej        dedd)           ej        dedd           ej        ddddd          	 	 d-deded ed"ed#eee                  d$eee                  fd*                                                                                    Zed+k    r e	             dS dS ).    )ListOptionalTupleN)measure_element_type_accuracy measure_text_extraction_accuracyc                      d S N r
       f/lsinfo/ai/hellotax_ai/base_platform/venv/lib/python3.11/site-packages/unstructured/ingest/evaluate.pymainr      s    Dr   z--output_dirzDirectory to structured output.)typehelpz--source_dirzDirectory to source.z--output_listTzOptional: list of selected structured output file names under the         directory to be evaluate. If none, all files under directory will be use.)r   multipler   z--source_listzOptional: list of selected source file names under the directory         to be evaluate. If none, all files under directory will be use.z--export_dirmetricsz`Directory to save the output evaluation metrics to. Default to         your/working/dir/metrics/)r   defaultr   z
--groupingz5Input field for aggregration, or leave blank if none.z	--weights)      r   zA list of weights to the Levenshtein distance calculation. Takes input as --weights 2 2 2        See text_extraction.py/calculate_edit_distance for more details.)r   r   show_defaultr   z--visualizeFz"Add the flag to show progress bar.)is_flagr   r   r   
output_dir
source_dir
export_dirweights	visualizeoutput_listsource_listgroupingc           
      .    t          | |||||||          S r	   )r   )r   r   r   r   r   r   r   r   s           r   (measure_text_extraction_accuracy_commandr       s*    d ,J[*hPWYb  r   zDirectory to structured source.zOptional: list of selected structured output file names under the         directory to be evaluate. If none, all files under directory will be used.zOptional: list of selected source file names under the directory         to be evaluate. If none, all files under directory will be used.c                 *    t          | |||||          S r	   )r   )r   r   r   r   r   r   s         r   %measure_element_type_accuracy_commandr"   I   s$    N )J[*i  r   __main__)NNN)NN)typingr   r   r   clickunstructured.metrics.evaluater   r   groupr   commandoptionstrintboolr    r"   __name__r
   r   r   <module>r.      s   ) ( ( ( ( ( ( ( ( (         	 	 	 n3-NOOOn3-CDDD	
S	   	
I	   	
#	   l+bccc
sC
J   	-   (,'+"   3S=!	
  $s)$ $s)$ sm     dc    ED PO P n3-NOOOn3-NOOO	
T	   	
J	   	
#	   	-   (,'+
 


 
 	

 $s)$
 $s)$
 
 
     PO PO >
 zDFFFFF r   