| | import logging |
| |
|
| | import datasets |
| |
|
| |
|
def check_dataset_and_get_config(dataset_id):
    """Return the config names available for ``dataset_id``.

    The lookup is delegated to ``datasets.get_dataset_config_names``.

    Args:
        dataset_id: Dataset identifier passed through unchanged to
            ``datasets.get_dataset_config_names``.

    Returns:
        Whatever ``datasets.get_dataset_config_names`` returns on success,
        or ``None`` if the call raises any ``Exception``.
    """
    try:
        return datasets.get_dataset_config_names(dataset_id)
    except Exception as e:
        # Best-effort lookup: callers rely on ``None`` to signal failure, but
        # the cause is logged (as the split helper in this file does) so that
        # failures are not silently swallowed.
        logging.warning(f"Failed to get configs for dataset {dataset_id}: {e}")
        return None
| |
|
| |
|
def check_dataset_and_get_split(dataset_id, dataset_config):
    """Load a dataset and return the keys of the loaded object as a list.

    The dataset is loaded with ``datasets.load_dataset(dataset_id,
    dataset_config)``; the keys of the result are treated as split names.

    Args:
        dataset_id: Dataset identifier forwarded to ``datasets.load_dataset``.
        dataset_config: Config name forwarded to ``datasets.load_dataset``.

    Returns:
        A list built from ``.keys()`` of the loaded dataset, or ``None`` when
        either loading or listing the keys raises an ``Exception`` (a warning
        is logged in both cases).
    """
    # Stage 1: loading. Any failure here is reported and ends the check.
    try:
        loaded = datasets.load_dataset(dataset_id, dataset_config)
    except Exception as load_error:
        logging.warning(
            f"Failed to load dataset {dataset_id} with config {dataset_config}: {load_error}"
        )
        return None

    # Stage 2: enumerate keys. An object without a usable ``keys()`` is
    # reported as having no splits.
    try:
        split_names = list(loaded.keys())
    except Exception as keys_error:
        logging.warning(
            f"Dataset {dataset_id} with config {dataset_config} has no splits: {keys_error}"
        )
        return None
    else:
        return split_names
| |
|