|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
""" Logging utilities. """ |
|
|
|
|
|
import logging |
|
|
# Install a default handler/format on the process-wide root logger as soon as
# this module is imported. ``basicConfig`` is a no-op when the root logger
# already has handlers. The level given here is later overwritten by the
# module-level ``_configure_root_logger()`` call further down this file.
logging.basicConfig(
    format="%(asctime)s - %(levelname)s - %(name)s - %(message)s",
    datefmt="%m/%d/%Y %H:%M:%S",
    level=logging.WARNING,
)
|
|
|
|
|
import os |
|
|
from logging import ( |
|
|
CRITICAL, |
|
|
DEBUG, |
|
|
ERROR, |
|
|
FATAL, |
|
|
INFO, |
|
|
NOTSET, |
|
|
WARN, |
|
|
WARNING, |
|
|
) |
|
|
from typing import Optional |
|
|
from tqdm import auto as tqdm_lib |
|
|
|
|
|
|
|
|
# Lowercase names accepted by the ``DATASETS_VERBOSITY`` environment variable,
# mapped to the matching standard-library level constants. Insertion order is
# the order in which the valid choices are listed in the "unknown option"
# warning emitted by ``_get_default_logging_level``.
log_levels = {
    "debug": DEBUG,
    "info": INFO,
    "warning": WARNING,
    "error": ERROR,
    "critical": CRITICAL,
}

# Level used when ``DATASETS_VERBOSITY`` is unset, empty, or not a key above.
_default_log_level = INFO
|
|
|
|
|
|
|
|
def _get_default_logging_level():
    """Resolve the log level to apply when this module configures logging.

    Reads the ``DATASETS_VERBOSITY`` environment variable:

    - unset or empty: ``_default_log_level`` is returned;
    - one of the keys of ``log_levels``: the mapped level is returned;
    - anything else: a warning listing the valid choices is logged through the
      root logger and ``_default_log_level`` is returned.

    The lookup is an exact (case-sensitive) match against ``log_levels``.
    """
    env_level_str = os.getenv("DATASETS_VERBOSITY")
    if not env_level_str:
        return _default_log_level

    try:
        return log_levels[env_level_str]
    except KeyError:
        # Unknown value: tell the user what is accepted, then fall back.
        logging.getLogger().warning(
            f"Unknown option DATASETS_VERBOSITY={env_level_str}, "
            f"has to be one of: { ', '.join(log_levels.keys()) }"
        )
    return _default_log_level
|
|
|
|
|
|
|
|
def _get_library_name() -> str:
    """Return the top-level package name this module lives in.

    That is the part of ``__name__`` before the first dot, or all of
    ``__name__`` when it contains no dot.
    """
    top_level, _, _ = __name__.partition(".")
    return top_level
|
|
|
|
|
|
|
|
def _get_root_logger() -> logging.Logger:
    """Return the root logger of the ``logging`` hierarchy.

    ``logging.getLogger`` is called without a name, so this is the
    process-wide root logger, not a logger namespaced to this library.
    Every verbosity helper in this module operates on the logger returned
    here.
    """
    return logging.getLogger(None)
|
|
|
|
|
|
|
|
def _configure_root_logger() -> None:
    """Set the root logger's level to the module's default verbosity.

    The level comes from ``_get_default_logging_level()``, i.e. from the
    ``DATASETS_VERBOSITY`` environment variable when it holds a valid value,
    otherwise from ``_default_log_level``.
    """
    logger = _get_root_logger()
    level = _get_default_logging_level()
    logger.setLevel(level)
|
|
|
|
|
|
|
|
def _reset_root_logger() -> None:
    """Reset the root logger's level to ``logging.NOTSET``."""
    _get_root_logger().setLevel(logging.NOTSET)
|
|
|
|
|
|
|
|
def get_logger(name: Optional[str] = None) -> logging.Logger:
    """Return the logger registered under ``name``.

    This function can be used in dataset scripts.

    Args:
        name:
            Logger name passed to ``logging.getLogger``. When ``None`` (the
            default), the library's top-level package name, as returned by
            ``_get_library_name()``, is used instead.

    Returns:
        The ``logging.Logger`` for the resolved name.
    """
    logger_name = _get_library_name() if name is None else name
    return logging.getLogger(logger_name)
|
|
|
|
|
|
|
|
def get_verbosity() -> int:
    """Return the effective level of the logger returned by ``_get_root_logger()``.

    Returns:
        The logging level as an integer, e.g. the value of `DEBUG` or `INFO`.

    <Tip>

    This module re-exports the standard `logging` level constants:
    - `CRITICAL`, `FATAL`
    - `ERROR`
    - `WARNING`, `WARN`
    - `INFO`
    - `DEBUG`

    </Tip>
    """
    root_logger = _get_root_logger()
    return root_logger.getEffectiveLevel()
|
|
|
|
|
|
|
|
def set_verbosity(verbosity: int) -> None:
    """Set the level of the logger returned by ``_get_root_logger()``.

    Args:
        verbosity:
            Logging level, e.g. one of the constants re-exported by this
            module such as `DEBUG` or `INFO`.
    """
    root_logger = _get_root_logger()
    root_logger.setLevel(verbosity)
|
|
|
|
|
|
|
|
def set_verbosity_info() -> None:
    """Set the verbosity to `INFO`.

    Shortcut for ``set_verbosity(INFO)``.
    """
    set_verbosity(INFO)
|
|
|
|
|
|
|
|
def set_verbosity_warning() -> None:
    """Set the verbosity to `WARNING`.

    Shortcut for ``set_verbosity(WARNING)``.
    """
    set_verbosity(WARNING)
|
|
|
|
|
|
|
|
def set_verbosity_debug() -> None:
    """Set the verbosity to `DEBUG`.

    Shortcut for ``set_verbosity(DEBUG)``.
    """
    set_verbosity(DEBUG)
|
|
|
|
|
|
|
|
def set_verbosity_error() -> None:
    """Set the verbosity to `ERROR`.

    Shortcut for ``set_verbosity(ERROR)``.
    """
    set_verbosity(ERROR)
|
|
|
|
|
|
|
|
def disable_propagation() -> None:
    """Set ``propagate = False`` on the logger returned by ``_get_root_logger()``.

    NOTE(review): that helper returns the ``logging`` root logger, which has
    no parent to propagate records to, so this flag presumably has no
    observable effect there. Confirm the intended target logger.
    """
    root_logger = _get_root_logger()
    root_logger.propagate = False
|
|
|
|
|
|
|
|
def enable_propagation() -> None:
    """Set ``propagate = True`` on the logger returned by ``_get_root_logger()``.

    NOTE(review): that helper returns the ``logging`` root logger, which has
    no parent to propagate records to, so this flag presumably has no
    observable effect there. Confirm the intended target logger.
    """
    root_logger = _get_root_logger()
    root_logger.propagate = True
|
|
|
|
|
|
|
|
|
|
|
# Import-time side effect: set the root logger's level from the
# ``DATASETS_VERBOSITY`` environment variable, or from ``_default_log_level``
# when that variable is unset or invalid.
_configure_root_logger()
|
|
|
|
|
|
|
|
class EmptyTqdm:
    """No-op stand-in for a tqdm progress bar.

    It accepts the same call shapes as ``tqdm`` (any positional and keyword
    arguments), iterates over the wrapped iterable without displaying
    anything, works as a context manager, and answers every other attribute
    lookup with a function that ignores its arguments and returns ``None``
    (so ``bar.update(1)``, ``bar.set_description(...)``, ``bar.close()`` and
    so on are all silently accepted).
    """

    def __init__(self, *args, **kwargs):
        """Remember the iterable to wrap, if one was given.

        Like ``tqdm``, the iterable may be passed either as the first
        positional argument or as the ``iterable=`` keyword. All other
        arguments are ignored.
        """
        # Falling back to the keyword keeps ``tqdm(iterable=xs, disable=True)``
        # iterable instead of failing later with ``iter(None)``.
        self._iterator = args[0] if args else kwargs.get("iterable")

    def __iter__(self):
        """Iterate over the wrapped iterable.

        Raises:
            TypeError: if no iterable was supplied at construction time.
        """
        return iter(self._iterator)

    def __getattr__(self, _):
        """Return a do-nothing function for any attribute not otherwise defined."""

        def empty_fn(*args, **kwargs):
            return

        return empty_fn

    def __enter__(self):
        """Enter the context and return this object."""
        return self

    def __exit__(self, type_, value, traceback):
        """Leave the context; returns ``None`` so exceptions are not suppressed."""
        return
|
|
|
|
|
|
|
|
# Module-wide progress-bar switch. ``_tqdm_cls`` reads it to choose between a
# real tqdm bar and the no-op ``EmptyTqdm``. It is flipped by
# ``enable_progress_bar`` / ``disable_progress_bar``.
_tqdm_active: bool = True
|
|
|
|
|
|
|
|
class _tqdm_cls:
    """Callable facade over ``tqdm_lib.tqdm`` that honors ``_tqdm_active``."""

    def __call__(self, *args, disable=False, **kwargs):
        """Build a progress bar, or a no-op ``EmptyTqdm`` when bars are off.

        A real ``tqdm_lib.tqdm`` is created only when the module-wide switch
        is on and ``disable`` is falsy. ``disable`` is consumed here and is
        not forwarded to either constructor.
        """
        bar_factory = tqdm_lib.tqdm if (_tqdm_active and not disable) else EmptyTqdm
        return bar_factory(*args, **kwargs)

    def set_lock(self, *args, **kwargs):
        """Forward to ``tqdm_lib.tqdm.set_lock`` when progress bars are enabled.

        Always resets this instance's ``_lock`` attribute to ``None`` first.
        Returns ``None`` when progress bars are disabled.
        """
        self._lock = None
        if not _tqdm_active:
            return None
        return tqdm_lib.tqdm.set_lock(*args, **kwargs)

    def get_lock(self):
        """Return ``tqdm_lib.tqdm.get_lock()``, or ``None`` when bars are disabled."""
        return tqdm_lib.tqdm.get_lock() if _tqdm_active else None

    def __delattr__(self, attr):
        """fix for https://github.com/huggingface/datasets/issues/6066

        Deletes ``attr`` from the instance dict. Deleting a missing ``_lock``
        is silently ignored; any other missing attribute raises
        ``AttributeError``.
        """
        try:
            self.__dict__.pop(attr)
        except KeyError:
            if attr == "_lock":
                return
            raise AttributeError(attr)


# Shared instance used as a drop-in replacement for the ``tqdm`` callable.
tqdm = _tqdm_cls()
|
|
|
|
|
|
|
|
def is_progress_bar_enabled() -> bool:
    """Report whether the module-wide tqdm switch (``_tqdm_active``) is on."""
    # Reading a module global needs no ``global`` declaration.
    return True if _tqdm_active else False
|
|
|
|
|
|
|
|
def enable_progress_bar() -> None:
    """Turn tqdm progress bars on by setting the module-wide ``_tqdm_active`` flag."""
    global _tqdm_active
    _tqdm_active = True
|
|
|
|
|
|
|
|
def disable_progress_bar() -> None:
    """Turn tqdm progress bars off by clearing the module-wide ``_tqdm_active`` flag."""
    global _tqdm_active
    _tqdm_active = False