Source code for squadds.core.db_views
# Default base URL for component images. ``build_dataset_rows`` uses it as the
# default ``image_base_url`` and appends ``/<component_name>.png`` to it.
DEFAULT_COMPONENT_IMAGE_BASE_URL = "https://github.com/LFL-Lab/SQuADDS/tree/master/docs/_static/images"
[docs]
def build_dataset_rows(components, component_names, data_types, image_base_url=DEFAULT_COMPONENT_IMAGE_BASE_URL):
    """
    Assemble the de-duplicated table rows shown by ``SQuADDS_DB.view_datasets``.

    Each row is ``[component, component_name, data_type, image_url]``, where
    ``image_url`` is ``f"{image_base_url}/{component_name}.png"``. The inputs
    are combined positionally with ``zip``, so entries beyond the shortest
    input are dropped. A row equal to an earlier one is skipped; the order of
    first occurrences is preserved.

    Returns:
        A list of four-element lists, one per distinct row.
    """
    # Build every URL up front so ``component_names`` is fully traversed
    # before the inputs are zipped together.
    image_links = [f"{image_base_url}/{label}.png" for label in component_names]

    # Dicts keep insertion order, so one mapping both detects repeats and
    # remembers the order in which distinct rows first appeared.
    first_seen = {}
    for record in zip(components, component_names, data_types, image_links):
        if record not in first_seen:
            first_seen[record] = list(record)
    return list(first_seen.values())
[docs]
def describe_dataset(dataset):
    """
    Gather the printable metadata attributes of a Hugging Face dataset split.

    Reads ``features``, ``description``, ``citation``, ``homepage``,
    ``license`` and ``size_in_bytes`` from ``dataset`` (in that order) and
    returns them in a dict keyed by attribute name.
    """
    metadata_fields = (
        "features",
        "description",
        "citation",
        "homepage",
        "license",
        "size_in_bytes",
    )
    return {field: getattr(dataset, field) for field in metadata_fields}