
    ͑i(                     4    S SK Jr  S SKJr  / r " S S5      rg)    )text_format)data_feed_pb2c                   6    \ rS rSrSrS rS rS rS rS r	Sr
g	)
DataFeedDesc   at  
:api_attr: Static Graph

Datafeed descriptor, describing input training data format.

DataFeedDesc shall be initialized from a valid protobuf message from disk.

See :code:`paddle/base/framework/data_feed.proto` for message definition.
A typical message might look like:

Examples:
    .. code-block:: python

        >>> import paddle.base as base
        >>> with open("data.proto", "w") as f:
        ...     f.write('name: "MultiSlotDataFeed"\n')
        ...     f.write('batch_size: 2\n')
        ...     f.write('multi_slot_desc {\n')
        ...     f.write('    slots {\n')
        ...     f.write('        name: "words"\n')
        ...     f.write('        type: "uint64"\n')
        ...     f.write('        is_dense: false\n')
        ...     f.write('        is_used: true\n')
        ...     f.write('    }\n')
        ...     f.write('    slots {\n')
        ...     f.write('        name: "label"\n')
        ...     f.write('        type: "uint64"\n')
        ...     f.write('        is_dense: false\n')
        ...     f.write('        is_used: true\n')
        ...     f.write('    }\n')
        ...     f.write('}')
        >>> data_feed = base.DataFeedDesc('data.proto')

    However, users usually shouldn't care about the message format; instead,
    they are encouraged to use :code:`Data Generator` as a tool to generate a
    valid data description, in the process of converting their raw log files to
    training files acceptable to Executor.

    DataFeedDesc can also be changed during runtime. Once you got familiar with
    what each field mean, you can modify it to better suit your need. E.g.:

    .. code-block:: python

        >>> import paddle.base as base
        >>> data_feed = base.DataFeedDesc('data.proto')
        >>> data_feed.set_batch_size(128)
        >>> data_feed.set_dense_slots(['words'])  # The slot named 'words' will be dense
        >>> data_feed.set_use_slots(['words'])    # The slot named 'words' will be used

        >>> # Finally, the content can be dumped out for debugging purpose:

        >>> print(data_feed.desc())

Args:
    proto_file(string): Disk file containing a data feed description.

c                    [         R                  " 5       U l        SU R                  l        [	        US5       n[
        R                  " UR                  5       U R                  5        S S S 5        U R                  R                  S:X  aO  [        U R                  R                  R                  5       VVs0 s H  u  p4UR                  U_M     snnU l        g g ! , (       d  f       Nx= fs  snnf )NcatrMultiSlotDataFeed)r   r   
proto_descpipe_commandopenr   Parsereadname	enumeratemulti_slot_descslots_DataFeedDesc__name_to_index)self
proto_filefislots        Z/var/www/html/banglarbhumi/venv/lib/python3.13/site-packages/paddle/base/data_feed_desc.py__init__DataFeedDesc.__init__Q   s    '446',$*c"aaffh8 #??#66  ))H)H)N)NO$OGA 		1O$D  7 #"$s   0C6C+
C(c                 $    XR                   l        g)a|  
Set :attr:`batch_size` in ``paddle.base.DataFeedDesc`` . :attr:`batch_size` can be changed during training.

Examples:
    .. code-block:: python

        >>> import paddle.base as base
        >>> with open("data.proto", "w") as f:
        ...     f.write('name: "MultiSlotDataFeed"\n')
        ...     f.write('batch_size: 2\n')
        ...     f.write('multi_slot_desc {\n')
        ...     f.write('    slots {\n')
        ...     f.write('        name: "words"\n')
        ...     f.write('        type: "uint64"\n')
        ...     f.write('        is_dense: false\n')
        ...     f.write('        is_used: true\n')
        ...     f.write('    }\n')
        ...     f.write('    slots {\n')
        ...     f.write('        name: "label"\n')
        ...     f.write('        type: "uint64"\n')
        ...     f.write('        is_dense: false\n')
        ...     f.write('        is_used: true\n')
        ...     f.write('    }\n')
        ...     f.write('}')
        >>> data_feed = base.DataFeedDesc('data.proto')
        >>> data_feed.set_batch_size(128)

Args:
    batch_size (int): The number of batch size.

Returns:
    None.

N)r   
batch_size)r   r   s     r   set_batch_sizeDataFeedDesc.set_batch_size\   s    F &0"    c                     U R                   R                  S:w  a  [        S5      eU H8  nSU R                   R                  R                  U R
                  U      l        M:     g)a  
Set slots in :attr:`dense_slots_name` as dense slots. **Note: In default, all slots are sparse slots.**

Features for a dense slot will be fed into a Tensor, while those for a
sparse slot will be fed into a DenseTensor.

Examples:
    .. code-block:: python

        >>> import paddle.base as base
        >>> with open("data.proto", "w") as f:
        ...     f.write('name: "MultiSlotDataFeed"\n')
        ...     f.write('batch_size: 2\n')
        ...     f.write('multi_slot_desc {\n')
        ...     f.write('    slots {\n')
        ...     f.write('        name: "words"\n')
        ...     f.write('        type: "uint64"\n')
        ...     f.write('        is_dense: false\n')
        ...     f.write('        is_used: true\n')
        ...     f.write('    }\n')
        ...     f.write('    slots {\n')
        ...     f.write('        name: "label"\n')
        ...     f.write('        type: "uint64"\n')
        ...     f.write('        is_dense: false\n')
        ...     f.write('        is_used: true\n')
        ...     f.write('    }\n')
        ...     f.write('}')
        >>> data_feed = base.DataFeedDesc('data.proto')
        >>> data_feed.set_dense_slots(['words'])

Args:
    dense_slots_name (list(str)): a list of slot names which will be set dense.

Returns:
    None.

r   zNOnly MultiSlotDataFeed needs set_dense_slots, please check your datafeed.protoTN)r   r   
ValueErrorr   r   r   is_dense)r   dense_slots_namer   s      r   set_dense_slotsDataFeedDesc.set_dense_slots   sd    L ??#66`  %D  OO++11$$T* %r"   c                     U R                   R                  S:w  a  [        S5      eU H8  nSU R                   R                  R                  U R
                  U      l        M:     g)a  
Set if a specific slot will be used for training. A dataset shall
contain a lot of features, through this function one can select which
ones will be used for a specific model.

Examples:
    .. code-block:: python

        >>> import paddle.base as base
        >>> with open("data.proto", "w") as f:
        ...     f.write('name: "MultiSlotDataFeed"\n')
        ...     f.write('batch_size: 2\n')
        ...     f.write('multi_slot_desc {\n')
        ...     f.write('    slots {\n')
        ...     f.write('        name: "words"\n')
        ...     f.write('        type: "uint64"\n')
        ...     f.write('        is_dense: false\n')
        ...     f.write('        is_used: true\n')
        ...     f.write('    }\n')
        ...     f.write('    slots {\n')
        ...     f.write('        name: "label"\n')
        ...     f.write('        type: "uint64"\n')
        ...     f.write('        is_dense: false\n')
        ...     f.write('        is_used: true\n')
        ...     f.write('    }\n')
        ...     f.write('}')
        >>> data_feed = base.DataFeedDesc('data.proto')
        >>> data_feed.set_use_slots(['words'])

Args:
    use_slots_name: a list of slot names which will be used in training

Note:
    Default is not used for all slots
r   zLOnly MultiSlotDataFeed needs set_use_slots, please check your datafeed.protoTN)r   r   r$   r   r   r   is_used)r   use_slots_namer   s      r   set_use_slotsDataFeedDesc.set_use_slots   sd    H ??#66^  #D  OO++11$$T* #r"   c                 B    [         R                  " U R                  5      $ )a  
Returns a protobuf message for this DataFeedDesc

Examples:
    .. code-block:: python

        >>> import paddle.base as base
        >>> with open("data.proto", "w") as f:
        ...     f.write('name: "MultiSlotDataFeed"\n')
        ...     f.write('batch_size: 2\n')
        ...     f.write('multi_slot_desc {\n')
        ...     f.write('    slots {\n')
        ...     f.write('        name: "words"\n')
        ...     f.write('        type: "uint64"\n')
        ...     f.write('        is_dense: false\n')
        ...     f.write('        is_used: true\n')
        ...     f.write('    }\n')
        ...     f.write('    slots {\n')
        ...     f.write('        name: "label"\n')
        ...     f.write('        type: "uint64"\n')
        ...     f.write('        is_dense: false\n')
        ...     f.write('        is_used: true\n')
        ...     f.write('    }\n')
        ...     f.write('}')
        >>> data_feed = base.DataFeedDesc('data.proto')
        >>> print(data_feed.desc())

Returns:
    A string message
)r   MessageToStringr   )r   s    r   descDataFeedDesc.desc   s    > **4??;;r"   )__name_to_indexr   N)__name__
__module____qualname____firstlineno____doc__r   r    r'   r,   r0   __static_attributes__ r"   r   r   r      s$    8t	#0J-^+Z<r"   r   N)google.protobufr   paddle.base.protor   __all__r   r9   r"   r   <module>r=      s    ( +
f< f<r"   