diff --git a/src/datasets/packaged_modules/folder_based_builder/folder_based_builder.py b/src/datasets/packaged_modules/folder_based_builder/folder_based_builder.py index 5626a28afd2..6c96d402aa1 100644 --- a/src/datasets/packaged_modules/folder_based_builder/folder_based_builder.py +++ b/src/datasets/packaged_modules/folder_based_builder/folder_based_builder.py @@ -2,7 +2,7 @@ import itertools import os from dataclasses import dataclass -from typing import Any, List, Optional, Tuple +from typing import List, Optional, Tuple import pandas as pd import pyarrow as pa @@ -10,6 +10,7 @@ import pyarrow.json as paj import datasets +from datasets.features.features import FeatureType from datasets.tasks.base import TaskTemplate @@ -66,7 +67,7 @@ class FolderBasedBuilder(datasets.GeneratorBasedBuilder): CLASSIFICATION_TASK: classification task to use if labels are obtained from the folder structure """ - BASE_FEATURE: Any + BASE_FEATURE: FeatureType BASE_COLUMN_NAME: str BUILDER_CONFIG_CLASS: FolderBasedBuilderConfig EXTENSIONS: List[str] diff --git a/tests/packaged_modules/test_folder_based_builder.py b/tests/packaged_modules/test_folder_based_builder.py index a7017ea054c..34fe3a62db7 100644 --- a/tests/packaged_modules/test_folder_based_builder.py +++ b/tests/packaged_modules/test_folder_based_builder.py @@ -11,6 +11,7 @@ FolderBasedBuilder, FolderBasedBuilderConfig, ) +from datasets.tasks import TextClassification class DummyFolderBasedBuilder(FolderBasedBuilder): @@ -18,7 +19,7 @@ class DummyFolderBasedBuilder(FolderBasedBuilder): BASE_COLUMN_NAME = "base" BUILDER_CONFIG_CLASS = FolderBasedBuilderConfig EXTENSIONS = [".txt"] - CLASSIFICATION_TASK = None + CLASSIFICATION_TASK = TextClassification(text_column="base", label_column="label") @pytest.fixture