o
    bil                     @   s8   d dl Zd dlmZ eddg					d
dd	ZdS )    N)keras_exportzkeras.utils.pad_sequencesz*keras.preprocessing.sequence.pad_sequencesint32pre        c                 C   s  t | ds	tdt| }g }d}d}	| D ]3}
z|t|
 |	r1t|
r1t|
jdd }d}	W q tyH } z
tdt|
 |d}~ww |du rRt	|}t
|tjp_t
|tj}t|trx|turx|sxtd	| d
t| dtj||f| ||d}
t| D ]p\}}t|sq|dkr|| d }n|dkr|d| }ntd| dtj||d}|jdd |krtd|jdd  d| d| |dkr||
|dt|f< q|dkr||
|t| df< qtd| d|
S )a  Pads sequences to the same length.

    This function transforms a list (of length `num_samples`)
    of sequences (lists of integers)
    into a 2D NumPy array of shape `(num_samples, num_timesteps)`.
    `num_timesteps` is either the `maxlen` argument if provided,
    or the length of the longest sequence in the list.

    Sequences that are shorter than `num_timesteps`
    are padded with `value` until they are `num_timesteps` long.

    Sequences longer than `num_timesteps` are truncated
    so that they fit the desired length.

    The position where padding or truncation happens is determined by
    the arguments `padding` and `truncating`, respectively.
    Pre-padding or removing values from the beginning of the sequence is the
    default.

    >>> sequence = [[1], [2, 3], [4, 5, 6]]
    >>> keras.utils.pad_sequences(sequence)
    array([[0, 0, 1],
           [0, 2, 3],
           [4, 5, 6]], dtype=int32)

    >>> keras.utils.pad_sequences(sequence, value=-1)
    array([[-1, -1,  1],
           [-1,  2,  3],
           [ 4,  5,  6]], dtype=int32)

    >>> keras.utils.pad_sequences(sequence, padding='post')
    array([[1, 0, 0],
           [2, 3, 0],
           [4, 5, 6]], dtype=int32)

    >>> keras.utils.pad_sequences(sequence, maxlen=2)
    array([[0, 1],
           [2, 3],
           [5, 6]], dtype=int32)

    Args:
        sequences: List of sequences (each sequence is a list of integers).
        maxlen: Optional Int, maximum length of all sequences. If not provided,
            sequences will be padded to the length of the longest individual
            sequence.
        dtype: (Optional, defaults to `"int32"`). Type of the output sequences.
            To pad sequences with variable length strings, you can use `object`.
        padding: String, "pre" or "post" (optional, defaults to `"pre"`):
            pad either before or after each sequence.
        truncating: String, "pre" or "post" (optional, defaults to `"pre"`):
            remove values from sequences larger than
            `maxlen`, either at the beginning or at the end of the sequences.
        value: Float or String, padding value. (Optional, defaults to `0.`)

    Returns:
        NumPy array with shape `(len(sequences), maxlen)`
    __len__z`sequences` must be iterable. T   NFz=`sequences` must be a list of iterables. Found non-iterable: z`dtype` z( is not compatible with `value`'s type: z;
You should set `dtype=object` for variable length strings.)dtyper   postzTruncating type "z" not understoodzShape of sample z of sequence at position z" is different from expected shape zPadding type ")hasattr
ValueErrorlenappendnpasarrayshape	TypeErrorstrmax
issubdtypestr_
isinstanceobjecttypefull	enumerate)	sequencesmaxlenr	   padding
truncatingvaluenum_sampleslengthssample_shapeflagxeis_dtype_stridxstruncr   r   R/home/ubuntu/.local/lib/python3.10/site-packages/keras/src/utils/sequence_utils.pypad_sequences   st   
G
r,   )Nr   r   r   r   )numpyr   keras.src.api_exportr   r,   r   r   r   r+   <module>   s    