{# Page-wide shorthands, all read from the collection mapping:
   pit_schema / field_schema - the "taco:"-prefixed key is tried first, then the unprefixed key, else an empty mapping;
   sources / extent          - default to an empty mapping when the key is absent.
   The expression after the set statements emits the page title (title, else id, else "TACO Dataset").
   NOTE(review): both branches of the inline_deps conditional are empty in this view - presumably asset includes belong there; confirm. #}{% set pit_schema = collection.get("taco:pit_schema", collection.get("pit_schema", {})) %} {% set field_schema = collection.get("taco:field_schema", collection.get("field_schema", {})) %} {% set sources = collection.get("taco:sources", {}) %} {% set extent = collection.get("extent", {}) %} {{ collection.get("title", collection.get("id", "TACO Dataset")) }} {% if inline_deps %} {% else %} {% endif %}
{# The back-link text is emitted only when catalogue_url is truthy. #}{% if catalogue_url %} Back to Catalogue {% endif %}
TACO DATASET DOCUMENTATION

{# Main heading: title, else id, else "Untitled Dataset" (note this last fallback differs from the one used for the page title). #}{{ collection.get("title", collection.get("id", "Untitled Dataset")) }}

{# Badge line: version (default "1.0.0"), id (default "unknown"), and the comma-joined licenses when any are present. #}v{{ collection.get("dataset_version", "1.0.0") }} {{ collection.get("id", "unknown") }} {% if collection.get("licenses") %}{{ collection.get("licenses", [])|join(", ") }}{% endif %}

Description

{# description_html is passed through the safe filter, so it is emitted without autoescaping.
   NOTE(review): assumes the caller has already sanitised this HTML - confirm. #}{{ description_html|safe }}

Dataset Overview

{# The statistics line and the spatial-coverage panel are rendered only when the sources mapping is non-empty. #}{% if sources %}
{# Partition count, then (when extent has a temporal entry) the first four characters of its first and second items.
   Assumes both items are ISO-8601 strings so the slice yields a year - TODO confirm. #}{{ sources["count"] }} partitions {% if extent.get("temporal") %} {{ extent["temporal"][0][:4] }} - {{ extent["temporal"][1][:4] }} temporal coverage {% endif %}

Spatial Coverage

Click on any region to view partition details

{% endif %} {# Keywords section: skipped when the collection has no keywords. #}{% if collection.get("keywords") %}

Keywords

{% for keyword in collection["keywords"] %} {{ keyword }} {% endfor %}
{% endif %} {# ML tasks section: skipped when the collection has no tasks. #}{% if collection.get("tasks") %}

ML Tasks

{% for task in collection["tasks"] %} {{ task }} {% endfor %}
{% endif %}
{% if pit_schema %}

TACO Structure (Position-Invariant Tree)

Hierarchical structure showing representative samples across levels. The "..." notation indicates additional samples following the same pattern. All samples at the same level share identical structure (PIT constraint).

Hierarchy Details

{# Hierarchy table.
   Row 1 is the column header, row 2 describes the root level read from pit_schema["root"],
   and one further row is emitted for every pattern of every entry in pit_schema["hierarchy"] (entries sorted by key).
   The per-level row must sit inside both loops: level and pattern are loop variables and do not exist once the loops end.
   A single-type pattern is shown as "All <type>", a mixed one as the types joined with " + ";
   at most three sample ids are previewed, followed by "..." when there are more. #}{% set root = pit_schema.get("root", {}) %}
Level Types Total Samples Sample IDs (preview)
Level 0 All {{ root.get("type", "UNKNOWN") }} {{ "{:,}".format(root.get("n", 0)) }} Root level samples
{% if pit_schema.get("hierarchy") %} {% for level, patterns in pit_schema["hierarchy"].items()|sort %} {% for pattern in patterns %}
Level {{ level }} {% if pattern.get("type", [])|length == 1 %}All {{ pattern["type"][0] }}{% else %}{{ pattern.get("type", [])|join(" + ") }}{% endif %} {{ "{:,}".format(pattern.get("n", 0)) }} {{ pattern.get("id", [])[:3]|join(", ") }}{% if pattern.get("id", [])|length > 3 %}...{% endif %}
{% endfor %} {% endfor %} {% endif %}
{% endif %} {% if field_schema %}

Metadata Fields by Level

These fields are available for querying with SQL when using TacoReader.

{# One table per entry of field_schema (entries sorted by key): a heading with the upper-cased key and the field count,
   a column header, then one row per field.
   Each field is indexed positionally: [0] name, [1] type, optional [2] description ("No description" when missing or empty).
   The row must sit inside the inner loop: field is a loop variable and does not exist once the loop ends. #}{% for level, fields in field_schema.items()|sort %}
{{ level.upper() }} ({{ fields|length }} fields)
Field Name Type Description
{% for field in fields %}
{{ field[0] }} {{ field[1] }} {% if field|length > 2 and field[2] %}{{ field[2] }}{% else %}No description{% endif %}
{% endfor %}
{% endfor %}
{% endif %}

Loading the Dataset

# pip install tacoreader
import tacoreader

# Load dataset
ds = tacoreader.load("{{ collection.get('id', 'dataset') }}.tacozip")

# Basic info
print(f"ID: {ds.id}")
print(f"Version: {ds.version}")
print(f"Samples: {len(ds.data)}")
{# The whole section is skipped when the collection lists neither providers nor curators. #}{% if collection.get("providers") or collection.get("curators") %}

Providers & Curators

{% if collection.get("providers") %}

Data Providers

{# Per provider: name (default "Unknown"), then its roles when present. #}{% for provider in collection["providers"] %}
{{ provider.get("name", "Unknown") }}
{% if provider.get("roles") %}
{% for role in provider["roles"] %} {{ role }} {% endfor %}
{% endif %}
{% endfor %} {% endif %} {% if collection.get("curators") %}

Dataset Curators

{# Per curator: name (default "Unknown"), then roles, organization and email, each only when present. #}{% for curator in collection["curators"] %}
{{ curator.get("name", "Unknown") }}
{% if curator.get("roles") %}
{% for role in curator["roles"] %} {{ role }} {% endfor %}
{% endif %} {% if curator.get("organization") %}
{{ curator["organization"] }}
{% endif %} {% if curator.get("email") %}
{{ curator["email"] }}
{% endif %}
{% endfor %} {% endif %}
{% endif %}

Publications & Citations

How to Cite This Dataset

If you use this dataset in your research, please cite:

{# Emits the citation text of every entry in "publications:list" that has one; the else branch prints a placeholder when the list is missing or empty.
   NOTE(review): the doi conditional has an empty body in this view - presumably a DOI link belongs there; confirm. #}{% if collection.get("publications:list") %} {% for pub in collection["publications:list"] %}
{% if pub.get("doi") %}{% endif %} {% if pub.get("citation") %}
{{ pub['citation'] }}
{% endif %}
{% endfor %} {% else %}

No publications specified

{% endif %}

BibTeX

{# Ready-to-copy BibTeX entry. The minus signs inside the tags strip the surrounding whitespace so each value sits tightly inside its braces.
   key       - id followed by the part of dataset_version before the first dot.
               NOTE(review): the fallback version here is "2024" while every other use falls back to "1.0.0" - confirm which is intended.
   author    - curator names joined with " and "; a curator without a name is listed as "Unknown", matching the curator listing; "Unknown" when there are no curators.
   year      - first four characters of the first temporal extent item, else 2024 (assumes an ISO-8601 string - TODO confirm).
   publisher - organization of the first curator, else "Unknown". #}@dataset{ {{- collection.get("id", "dataset") -}} {{ collection.get("dataset_version", "2024").split(".")[0] }},
  title = { {{- collection.get("title", collection.get("id", "Dataset")) -}} },
  author = { 
    {%- if collection.get("curators") -%}
      {{ collection["curators"]|map(attribute='name', default='Unknown')|join(' and ') }}
    {%- else -%}
      Unknown
    {%- endif -%}
  },
  year = { 
    {%- if extent.get("temporal") -%}
      {{ extent["temporal"][0][:4] }}
    {%- else -%}
      2024
    {%- endif -%}
  },
  version = { {{- collection.get("dataset_version", "1.0.0") -}} },
  publisher = { 
    {%- if collection.get("curators") and collection["curators"][0].get("organization") -%}
      {{ collection["curators"][0]["organization"] }}
    {%- else -%}
      Unknown
    {%- endif -%}
  }
}
{# NOTE(review): every branch of these two conditionals (inline_deps, js_map) is empty in this view - presumably script includes belong here; confirm before editing. #}{% if inline_deps %} {% else %} {% endif %} {% if js_map %}{% endif %}