File size: 438 Bytes
1719436
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3e35a01
 
 
1719436
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
import json

import datasets
import pandas as pd
import pandera.pandas as pa

from src.common.paths import DATASET_NAME
from src.common.schema import DatasetSchema


@pa.check_output(DatasetSchema)
def load_dataset() -> pd.DataFrame:
    """Load the ``"test"`` split of ``DATASET_NAME`` as a pandas DataFrame.

    The split is fetched with ``datasets.load_dataset`` and wrapped in a
    ``pd.DataFrame``. Every value in the column named by
    ``DatasetSchema.correct_answer`` is then passed through ``json.loads``
    and the column is overwritten with the decoded results.

    Returns:
        The resulting DataFrame. The ``pa.check_output`` decorator checks
        it against ``DatasetSchema`` before it reaches the caller.
    """
    test_split = datasets.load_dataset(DATASET_NAME, split="test")
    frame = pd.DataFrame(test_split)

    # NOTE(review): presumably this column holds JSON-encoded strings in the
    # raw dataset — confirm against the dataset card / DatasetSchema.
    answer_column = DatasetSchema.correct_answer
    decoded_answers = frame[answer_column].apply(json.loads)
    frame[answer_column] = decoded_answers
    return frame