
    hu                     j    d dl mZ d dlmZmZmZmZ ddlmZm	Z	 ddl
mZmZ ddlmZ  G d de      Zy	)
    )Path)AnyCallableOptionalUnion   )default_loadermake_dataset)download_and_extract_archiveverify_str_arg)VisionDatasetc                        e Zd ZdZdZdZddddefdeee	f   ded	e
e   d
e
e   dedeegef   ddf fdZdefdZdedeeef   fdZdefdZdefdZddZ xZS )RenderedSST2an  `The Rendered SST2 Dataset <https://github.com/openai/CLIP/blob/main/data/rendered-sst2.md>`_.

    Rendered SST2 is an image classification dataset used to evaluate the models capability on optical
    character recognition. This dataset was generated by rendering sentences in the Standford Sentiment
    Treebank v2 dataset.

    This dataset contains two classes (positive and negative) and is divided in three splits: a  train
    split containing 6920 images (3610 positive and 3310 negative), a validation split containing 872 images
    (444 positive and 428 negative), and a test split containing 1821 images (909 positive and 912 negative).

    Args:
        root (str or ``pathlib.Path``): Root directory of the dataset.
        split (string, optional): The dataset split, supports ``"train"`` (default), `"val"` and ``"test"``.
        transform (callable, optional): A function/transform that takes in a PIL image or torch.Tensor, depends on the given loader,
            and returns a transformed version. E.g, ``transforms.RandomCrop``
        target_transform (callable, optional): A function/transform that takes in the target and transforms it.
        download (bool, optional): If True, downloads the dataset from the internet and
            puts it in root directory. If dataset is already downloaded, it is not
            downloaded again. Default is False.
        loader (callable, optional): A function to load an image given its path.
            By default, it uses PIL as its image loader, but users could also pass in
            ``torchvision.io.decode_image`` for decoding image data into tensors directly.
    z>https://openaipublic.azureedge.net/clip/data/rendered-sst2.tgz 2384d08e9dcfa4bd55b324e610496ee5trainNFrootsplit	transformtarget_transformdownloadloaderreturnc                    t         |   |||       t        |dd      | _        dddd| _        t        | j                        dz  | _        dd	g| _        d
dd| _	        |r| j                          | j                         st        d      t        t        | j                  | j                  | j                     z        d      | _        || _        y )N)r   r   r   )r   valtestr   validr   zrendered-sst2negativepositiver   r   )r   r   z;Dataset not found. You can use download=True to download it)png)
extensions)super__init__r   _split_split_to_folderr   r   _base_folderclassesclass_to_idx	_download_check_existsRuntimeErrorr
   str_samplesr   )selfr   r   r   r   r   r   	__class__s          `/var/www/html/eduruby.in/venv/lib/python3.12/site-packages/torchvision/datasets/rendered_sst2.pyr"   zRenderedSST2.__init__%   s     	EUV$UG5MN*1'6 R Oo="J/)*:NN!!#\]]$S):):T=R=RSWS^S^=_)_%`muv    c                 ,    t        | j                        S N)lenr,   r-   s    r/   __len__zRenderedSST2.__len__>   s    4==!!r0   idxc                     | j                   |   \  }}| j                  |      }| j                  r| j                  |      }| j                  r| j                  |      }||fS r2   )r,   r   r   r   )r-   r6   
image_filelabelimages        r/   __getitem__zRenderedSST2.__getitem__A   s[     MM#.
EJ'>>NN5)E  ))%0Ee|r0   c                      d| j                    S )Nzsplit=)r#   r4   s    r/   
extra_reprzRenderedSST2.extra_reprM   s    }%%r0   c                     t        | j                        D ];  }| j                  | j                  | j                     z  |z  j                         r; y y)NFT)setr&   r%   r$   r#   is_dir)r-   class_labels     r/   r)   zRenderedSST2._check_existsP   sM    t||, 	K%%(=(=dkk(JJ[X``b	 r0   c                 ~    | j                         ry t        | j                  | j                  | j                         y )N)download_rootmd5)r)   r   _URLr   _MD5r4   s    r/   r(   zRenderedSST2._downloadV   s)    $TYYdiiTYYWr0   )r   N)__name__
__module____qualname____doc__rE   rF   r	   r   r+   r   r   r   boolr   r"   intr5   tupler;   r=   r)   r(   __classcell__)r.   s   @r/   r   r   	   s    0 LD-D
 (,/3'5CI  H%	
 #8,  #$ 
2" "
s 
uS#X 
&C &t Xr0   r   N)pathlibr   typingr   r   r   r   folderr	   r
   utilsr   r   visionr   r    r0   r/   <module>rU      s'     1 1 0 ? !PX= PXr0   