U
    <A·fة  م                   @   sڑ   d dl Z d dlZd dlmZmZmZmZmZmZ d dl	m
  mZ d dlmZm
Z
 d dlmZ d dlmZ d dlmZ G dd„ dƒZG d	d
„ d
e
jƒZdS )é    N)عAnyعDictعIterableعListعOptionalعUnion)عTensorعnn)عSentenceTransformer)عCachedGISTEmbedLoss)ع"CachedMultipleNegativesRankingLossc                   @   sX   e Zd Zddœdd„Zddœdd„Zeedœdd	„Zeeef eeef d
œdd„Z	dS )عForwardDecoratorN©عreturnc                 C   s"   || _ d | _g | _d | _d| _d S ©Nr   )عfnعdimعcacheع	cache_dimعidx)عselfr   © r   ْO/tmp/pip-unpacked-wheel-i7fohqg6/sentence_transformers/losses/MatryoshkaLoss.pyع__init__   s
    zForwardDecorator.__init__c                 C   s   || _ d| _d S r   )r   r   )r   r   r   r   r   عset_dim   s    zForwardDecorator.set_dim)عtensorr   c                 C   sP   |j d }| j|kr*td| j› d|› ‌ƒ‚|dd | j…f }tj|dddچ}|S )Néےےےےz
Dimension zL in matryoshka_dims cannot be greater than the model's embedding dimension: .é   )عpr   )عshaper   ع
ValueErrorعFع	normalize)r   r   Z
tensor_dimr   r   r   عshrink   s    

ےzForwardDecorator.shrink)عfeaturesr   c                 C   sx   | j d ks| j | jkr6|  |،}| j |، | j| _ n| j| j }|  |d ،|d< |  |d ،|d< |  jd7  _|S )NZtoken_embeddingsZsentence_embeddingé   )r   r   r   r   عappendr   r#   )r   r$   عoutputr   r   r   ع__call__$   s    

zForwardDecorator.__call__)
ع__name__ع
__module__ع__qualname__r   r   r   r#   r   عstrr(   r   r   r   r   r      s   
r   c                	       sٹ   e Zd Zdeejee eee	e
ef   eddœ‡ fdd„Zeeeef  eedœdd„Zeeef d	œd
d„Zeed	œdd„ƒZ‡  ZS )عMatryoshkaLossNr   )عmodelعlossعmatryoshka_dimsعmatryoshka_weightsعn_dims_per_stepr   c                    sژ   t ƒ  ،  || _|| _t|tƒr.tjdddچ t|tƒrFtjdddچ |dkr\dgt	|ƒ }t
||ƒ}t
t|dd„ d	d
چژ \| _| _|| _dS )a  
        The MatryoshkaLoss can be seen as a loss *modifier* that allows you to use other loss functions at various
        different embedding dimensions. This is useful for when you want to train a model where users have the option
        to lower the embedding dimension to improve their embedding comparison speed and costs.

        Args:
            model: SentenceTransformer model
            loss: The loss function to be used, e.g.
                :class:`MultipleNegativesRankingLoss`,
                :class:`CoSENTLoss`, etc.
            matryoshka_dims: A list of embedding dimensions to be used
                for the loss function, e.g. [768, 512, 256, 128, 64].
            matryoshka_weights: A list of weights to be used for the
                loss function, e.g. [1, 1, 1, 1, 1]. If None, then the
                weights will be set to 1 for all dimensions.
            n_dims_per_step: The number of dimensions to use per step.
                If -1, then all dimensions are used. If > 0, then a
                random sample of n_dims_per_step dimensions are used per
                step. The default value is -1.

        References:
            - The concept was introduced in this paper: https://arxiv.org/abs/2205.13147
            - `Matryoshka Embeddings <../../examples/training/matryoshka/README.html>`_

        Requirements:
            1. The base loss cannot be :class:`CachedMultipleNegativesRankingLoss` or :class:`CachedGISTEmbedLoss`.

        Relations:
            - :class:`Matryoshka2dLoss` uses this loss in combination with :class:`AdaptiveLayerLoss` which allows for
                layer reduction for faster inference.

        Input:
            +---------------------------------------+--------+
            | Texts                                 | Labels |
            +=======================================+========+
            | any                                   | any    |
            +---------------------------------------+--------+

        Example:
            ::

                from sentence_transformers import SentenceTransformer, losses, InputExample
                from torch.utils.data import DataLoader

                model = SentenceTransformer("microsoft/mpnet-base")
                train_examples = [
                    InputExample(texts=['Anchor 1', 'Positive 1']),
                    InputExample(texts=['Anchor 2', 'Positive 2']),
                ]
                train_dataloader = DataLoader(train_examples, shuffle=True, batch_size=32)
                train_loss = losses.MultipleNegativesRankingLoss(model=model)
                train_loss = losses.MatryoshkaLoss(model, train_loss, [768, 512, 256, 128, 64])
                model.fit(
                    [(train_dataloader, train_loss)],
                    epochs=10,
                )
        zIMatryoshkaLoss is not compatible with CachedMultipleNegativesRankingLoss.r   )ع
stacklevelz:MatryoshkaLoss is not compatible with CachedGISTEmbedLoss.Nr%   c                 S   s   | d S r   r   )عxr   r   r   ع<lambda>پ   َ    z)MatryoshkaLoss.__init__.<locals>.<lambda>T)عkeyعreverse)عsuperr   r.   r/   ع
isinstancer   عwarningsعwarnr   عlenعzipعsortedr0   r1   r2   )r   r.   r/   r0   r1   r2   Zdims_weights©ع	__class__r   r   r   4   s    A



zMatryoshkaLoss.__init__)عsentence_featuresعlabelsr   c           
      C   s    | j j}zˆt|ƒ}|| j _tt| jƒƒ}| jdkrN| jt|ƒk rNt || j،}d}|D ]6}| j| }| j	| }	| 
|، ||	|  ||، 7 }qVW 5 || j _X |S )Nr   g        )r.   عforwardr   عranger=   r0   r2   عrandomعsampler1   r   r/   )
r   rB   rC   Zoriginal_forwardZdecorated_forwardZdim_indicesr/   r   r   Zweightr   r   r   rD   „   s    



zMatryoshkaLoss.forwardr   c                 C   s   | j jj| j| j| jdœS )N)r/   r0   r1   r2   )r/   rA   r)   r0   r1   r2   ©r   r   r   r   عget_config_dictک   s
    üzMatryoshkaLoss.get_config_dictc                 C   s   dS )Naٹ  
@misc{kusupati2024matryoshka,
    title={Matryoshka Representation Learning}, 
    author={Aditya Kusupati and Gantavya Bhatt and Aniket Rege and Matthew Wallingford and Aditya Sinha and Vivek Ramanujan and William Howard-Snyder and Kaifeng Chen and Sham Kakade and Prateek Jain and Ali Farhadi},
    year={2024},
    eprint={2205.13147},
    archivePrefix={arXiv},
    primaryClass={cs.LG}
}
r   rH   r   r   r   عcitation    s    zMatryoshkaLoss.citation)Nr   )r)   r*   r+   r
   r	   عModuler   عintr   r   عfloatr   r   r   r,   r   rD   r   rI   عpropertyrJ   ع__classcell__r   r   r@   r   r-   3   s     ْùPr-   )rF   r;   عtypingr   r   r   r   r   r   Ztorch.nn.functionalr	   Z
functionalr!   Ztorchr   Zsentence_transformersr
   Z0sentence_transformers.losses.CachedGISTEmbedLossr   Z?sentence_transformers.losses.CachedMultipleNegativesRankingLossr   r   rK   r-   r   r   r   r   ع<module>   s    &