U
    <A·fƒ  ã                   @   s’   d dl Z d dlZd dlZd dlmZ d dlmZmZmZm	Z	 d dl
Zd dlZd dlmZ d dlmZ ertd dlmZ e e¡ZG dd„ deƒZdS )	é    N)Únullcontext)ÚTYPE_CHECKINGÚDictÚListÚOptional)ÚSentenceEvaluator)Úpytorch_cos_sim)ÚSentenceTransformerc                
       sb   e Zd ZdZdee ee eeeeeee dœ‡ fdd	„Z	ddeeee
eef dœdd„Z‡  ZS )ÚTranslationEvaluatora  
    Given two sets of sentences in different languages, e.g. (en_1, en_2, en_3...) and (fr_1, fr_2, fr_3, ...),
    and assuming that fr_i is the translation of en_i.
    Checks if vec(en_i) has the highest similarity to vec(fr_i). Computes the accuracy in both directions

    Example:
        ::

            from sentence_transformers import SentenceTransformer
            from sentence_transformers.evaluation import TranslationEvaluator
            from datasets import load_dataset

            # Load a model
            model = SentenceTransformer('paraphrase-multilingual-mpnet-base-v2')

            # Load a parallel sentences dataset
            dataset = load_dataset("sentence-transformers/parallel-sentences-news-commentary", "en-nl", split="train[:1000]")

            # Initialize the TranslationEvaluator using the same texts from two languages
            translation_evaluator = TranslationEvaluator(
                source_sentences=dataset["english"],
                target_sentences=dataset["non_english"],
                name="news-commentary-en-nl",
            )
            results = translation_evaluator(model)
            '''
            Evaluating translation matching Accuracy of the model on the news-commentary-en-nl dataset:
            Accuracy src2trg: 90.80
            Accuracy trg2src: 90.40
            '''
            print(translation_evaluator.primary_metric)
            # => "news-commentary-en-nl_mean_accuracy"
            print(results[translation_evaluator.primary_metric])
            # => 0.906
    Fé   Ú TN)Úsource_sentencesÚtarget_sentencesÚshow_progress_barÚ
batch_sizeÚnameÚprint_wrong_matchesÚ	write_csvÚtruncate_dimc	           	         s„   t ƒ  ¡  || _|| _|| _|| _|| _|| _|| _t	| jƒt	| jƒksLt
‚|rXd| }d| d | _ddddg| _|| _d| _d	S )
aå  
        Constructs an evaluator based for the dataset

        The labels need to indicate the similarity between the sentences.

        Args:
            source_sentences (List[str]): List of sentences in the source language.
            target_sentences (List[str]): List of sentences in the target language.
            show_progress_bar (bool): Whether to show a progress bar when computing embeddings. Defaults to False.
            batch_size (int): The batch size to compute sentence embeddings. Defaults to 16.
            name (str): The name of the evaluator. Defaults to an empty string.
            print_wrong_matches (bool): Whether to print incorrect matches. Defaults to False.
            write_csv (bool): Whether to write the evaluation results to a CSV file. Defaults to True.
            truncate_dim (int, optional): The dimension to truncate sentence embeddings to. If None, the model's
                current truncation dimension will be used. Defaults to None.
        Ú_Ztranslation_evaluationz_results.csvÚepochÚstepsZsrc2trgZtrg2srcÚmean_accuracyN)ÚsuperÚ__init__r   r   r   r   r   r   r   ÚlenÚAssertionErrorÚcsv_fileÚcsv_headersr   Zprimary_metric)	Úselfr   r   r   r   r   r   r   r   ©Ú	__class__© úY/tmp/pip-unpacked-wheel-i7fohqg6/sentence_transformers/evaluation/TranslationEvaluator.pyr   8   s    
zTranslationEvaluator.__init__éÿÿÿÿr	   )ÚmodelÚoutput_pathr   r   Úreturnc              	   C   s  |dkr0|dkrd|› }q4d|› d|› d}nd}| j d k	rP|d| j › d7 }t d	| j› d
|› d¡ | j d krztƒ n
| | j ¡B t |j| j	| j
| jdd¡}t |j| j| j
| jdd¡}W 5 Q R X t||ƒ ¡  ¡  ¡ }d}	d}
tt|ƒƒD ]ê}t || ¡}||kr|	d7 }	qø| jrøtd|d|d|ƒ td| j	| ƒ td| j| d|| | d›dƒ td| j| d|| | d›dƒ t|| ƒ}t|dd„ dd}|d d… D ](\}}td|d|d›d| j| ƒ q¸qø|j}tt|ƒƒD ]&}t || ¡}||krö|
d7 }
qö|	t|ƒ }|
t|ƒ }t d |d ¡¡ t d  |d ¡¡ |d k	rà| jràtj || j¡}tj  |¡}t!|d|rœd!nd"d#d$4}t" #|¡}|sÄ| $| j%¡ | $||||g¡ W 5 Q R X |||| d% d&œ}|  &|| j¡}|  '||¡ |S )'Nr$   z after epoch z
 in epoch z after z stepsr   z (truncated to ú)z=Evaluating translation matching Accuracy of the model on the z datasetú:F)r   r   Zconvert_to_numpyr   é   z
Incorrect  : Sourcezis most similar to targetzinstead of targetzSource     :zPred Target:z(Score: z.4fzTrue Target:c                 S   s   | d S )Nr*   r"   )Úxr"   r"   r#   Ú<lambda>˜   ó    z/TranslationEvaluator.__call__.<locals>.<lambda>T)ÚkeyÚreverseé   ú	zAccuracy src2trg: {:.2f}éd   zAccuracy trg2src: {:.2f}ÚaÚwzutf-8)ÚnewlineÚmodeÚencodingé   )Zsrc2trg_accuracyZtrg2src_accuracyr   )(r   ÚloggerÚinfor   r   Ztruncate_sentence_embeddingsÚtorchÚstackÚencoder   r   r   r   r   ÚdetachÚcpuÚnumpyÚranger   ÚnpZargmaxr   ÚprintÚ	enumerateÚsortedÚTÚformatr   ÚosÚpathÚjoinr   ÚisfileÚopenÚcsvÚwriterÚwriterowr   Zprefix_name_to_metricsZ store_metrics_in_model_card_data)r   r%   r&   r   r   Zout_txtZembeddings1Zembeddings2Zcos_simsZcorrect_src2trgZcorrect_trg2srcÚiZmax_idxÚresultsÚidxZscoreZacc_src2trgZacc_trg2srcZcsv_pathZoutput_file_existsÚfrN   Zmetricsr"   r"   r#   Ú__call__f   s‚    
üÿüÿ	

$$$


ýzTranslationEvaluator.__call__)Fr   r   FTN)Nr$   r$   )Ú__name__Ú
__module__Ú__qualname__Ú__doc__r   ÚstrÚboolÚintr   r   r   ÚfloatrT   Ú__classcell__r"   r"   r    r#   r
      s6   (      ÷÷/     ÿ   
þr
   )rM   ÚloggingrH   Ú
contextlibr   Útypingr   r   r   r   r@   rB   r;   Z2sentence_transformers.evaluation.SentenceEvaluatorr   Zsentence_transformers.utilr   Z)sentence_transformers.SentenceTransformerr	   Ú	getLoggerrU   r9   r
   r"   r"   r"   r#   Ú<module>   s   