Skip to content

WinoGrande

get_input_data_model()

Returns WinoGrande input data model.

Source code in synalinks/src/datasets/built_in/winogrande.py
@synalinks_export("synalinks.datasets.winogrande.get_input_data_model")
def get_input_data_model():
    """Returns WinoGrande input data model."""
    return WinoGrandeQuestion

get_output_data_model()

Returns WinoGrande output data model.

Source code in synalinks/src/datasets/built_in/winogrande.py
@synalinks_export("synalinks.datasets.winogrande.get_output_data_model")
def get_output_data_model():
    """Returns WinoGrande output data model."""
    return WinoGrandeAnswer

iterable_dataset(repeat=1, batch_size=1, limit=None, split='train')

Streaming dataset for RL-style training.

Returns:

Type Description
HuggingFaceDataset

A streaming, iterable dataset.

Source code in synalinks/src/datasets/built_in/winogrande.py
@synalinks_export("synalinks.datasets.winogrande.iterable_dataset")
def iterable_dataset(repeat=1, batch_size=1, limit=None, split="train"):
    """
    Streaming dataset for RL-style training.

    Returns:
        (HuggingFaceDataset): A streaming, iterable dataset.
    """
    return HuggingFaceDataset(
        path="allenai/winogrande",
        name="winogrande_xl",
        split=split,
        streaming=True,
        input_data_model=WinoGrandeQuestion,
        input_template=_INPUT_TEMPLATE,
        output_data_model=WinoGrandeAnswer,
        output_template=_OUTPUT_TEMPLATE,
        batch_size=batch_size,
        limit=limit,
        repeat=repeat,
    )

load_data()

Load WinoGrande (XL).

HF test split has no public labels, so we use train for training and validation for evaluation.

Returns:

Type Description
tuple

(x_train, y_train), (x_test, y_test).

Source code in synalinks/src/datasets/built_in/winogrande.py
@synalinks_export("synalinks.datasets.winogrande.load_data")
def load_data():
    """
    Load WinoGrande (XL).

    HF ``test`` split has no public labels, so we use ``train`` for
    training and ``validation`` for evaluation.

    Returns:
        (tuple): ``(x_train, y_train), (x_test, y_test)``.
    """
    x_train, y_train = _load("train")
    x_test, y_test = _load("validation")
    return (x_train, y_train), (x_test, y_test)