diff --git a/docs/content/_navigation.json b/docs/content/_navigation.json
index e2e64c085f04d..1aaf086194832 100644
--- a/docs/content/_navigation.json
+++ b/docs/content/_navigation.json
@@ -295,6 +295,10 @@
"title": "Asset metadata",
"path": "/concepts/metadata-tags/asset-metadata"
},
+ {
+ "title": "Table metadata",
+ "path": "/concepts/metadata-tags/asset-metadata/table-metadata"
+ },
{
"title": "Column-level lineage",
"path": "/concepts/metadata-tags/asset-metadata/column-level-lineage"
@@ -1547,4 +1551,4 @@
}
]
}
-]
\ No newline at end of file
+]
diff --git a/docs/content/api/modules.json.gz b/docs/content/api/modules.json.gz
index d86286e573b31..3704ed246e40f 100644
Binary files a/docs/content/api/modules.json.gz and b/docs/content/api/modules.json.gz differ
diff --git a/docs/content/api/searchindex.json.gz b/docs/content/api/searchindex.json.gz
index 59db04171ae4b..8e2a93b543da1 100644
Binary files a/docs/content/api/searchindex.json.gz and b/docs/content/api/searchindex.json.gz differ
diff --git a/docs/content/api/sections.json.gz b/docs/content/api/sections.json.gz
index 5b024ce370382..66c5ed30d73f1 100644
Binary files a/docs/content/api/sections.json.gz and b/docs/content/api/sections.json.gz differ
diff --git a/docs/content/concepts/metadata-tags/asset-metadata.mdx b/docs/content/concepts/metadata-tags/asset-metadata.mdx
index 24b8c3741db27..86ea2311cea04 100644
--- a/docs/content/concepts/metadata-tags/asset-metadata.mdx
+++ b/docs/content/concepts/metadata-tags/asset-metadata.mdx
@@ -28,7 +28,7 @@ Dagster supports attaching a few different types of definition metadata:
- [**Arbitrary metadata**](#arbitrary-metadata-using-the-metadata-parameter), such as the storage location of the table produced by the asset
- [**Asset owners**](#asset-owners), which are the people and/or teams who own the asset
-- [**Column-level lineage**](#column-level-lineage), which is information about how a column is created and used
+- [**Table metadata**](#table-metadata), which provides additional context about a tabular asset, such as its schema or row count
### Arbitrary metadata using the metadata parameter
@@ -129,9 +129,9 @@ def topstories(context: AssetExecutionContext) -> MaterializeResult:
)
```
-### Column-level lineage
+### Table metadata
-For assets that produce database tables, column-level lineage can be a powerful tool for improving collaboration and debugging issues. Column lineage enables data and analytics engineers alike to understand how a column is created and used in your data platform. Refer to the [Column-level lineage documentation](/concepts/metadata-tags/asset-metadata/column-level-lineage) for more information.
+For assets which produce database tables, you can attach table metadata to provide additional context about the asset. Table metadata can include information such as the schema, row count, or column lineage. Refer to the [Table metadata documentation](/concepts/metadata-tags/asset-metadata/table-metadata) for more information.
---
diff --git a/docs/content/concepts/metadata-tags/asset-metadata/table-metadata.mdx b/docs/content/concepts/metadata-tags/asset-metadata/table-metadata.mdx
new file mode 100644
index 0000000000000..7c4cfeece58ae
--- /dev/null
+++ b/docs/content/concepts/metadata-tags/asset-metadata/table-metadata.mdx
@@ -0,0 +1,192 @@
+---
+title: "Table metadata | Dagster Docs"
+description: "Table metadata can be used to provide additional context about a tabular asset, such as its schema, row count, and more."
+---
+
+# Table metadata
+
+Table metadata provides additional context about a tabular asset, such as its schema, row count, and more. This metadata can be used to improve collaboration, debugging, and data quality in your data platform.
+
+Dagster supports attaching different types of table metadata to assets, including:
+
+- [**Column schema**](#attaching-column-schema): Describes the structure of the table, including column names and types
+- [**Row count**](#attaching-row-count): Describes the number of rows in a materialized table
+- [**Column-level lineage**](#attaching-column-level-lineage): Describes how a column is created and used by other assets
+
+---
+
+## Attaching column schema
+
+### For assets defined in Dagster
+
+
+
+You may attach column schema metadata to Dagster assets either as [definition metadata](/concepts/metadata-tags/asset-metadata#attaching-definition-metadata) or [materialization metadata](/concepts/metadata-tags/asset-metadata#attaching-materialization-metadata). If the schema of your asset is pre-defined, you can attach it as definition metadata. If the schema is only known when an asset is materialized, you can attach it as metadata to that materialization.
+
+To attach schema metadata to an asset, you will need to:
+
+1. Construct a object with entries describing each column in the table
+2. Attach the `TableSchema` object to the asset as part of the `metadata` parameter under the `dagster/column_schema` key. This can be attached to your asset definition, or to the object returned by the asset function
+
+Below are two examples of how to attach column schema metadata to an asset, one as definition metadata and one as materialization metadata:
+
+```python file=/concepts/metadata-tags/asset_column_schema.py
+from dagster import AssetKey, MaterializeResult, TableColumn, TableSchema, asset
+
+
+# Here, we know the schema of the asset, so we can attach it to the asset decorator
+@asset(
+ deps=[AssetKey("source_bar"), AssetKey("source_baz")],
+ metadata={
+ "dagster/column_schema": TableSchema(
+ columns=[
+ TableColumn(
+ "name",
+ "string",
+ description="The name of the person",
+ ),
+ TableColumn(
+ "age",
+ "int",
+ description="The age of the person",
+ ),
+ ]
+ )
+ },
+)
+def my_asset(): ...
+
+
+# Here, the schema isn't known until runtime
+@asset(deps=[AssetKey("source_bar"), AssetKey("source_baz")])
+def my_other_asset():
+ column_names = ...
+ column_types = ...
+
+ columns = [
+ TableColumn(name, column_type)
+ for name, column_type in zip(column_names, column_types)
+ ]
+
+ yield MaterializeResult(
+ metadata={"dagster/column_schema": TableSchema(columns=columns)}
+ )
+```
+
+The schema for `my_asset` will be visible in the Dagster UI. You may optionally attach to each column to provide additional context about the values in the column:
+
+```python file=/concepts/metadata-tags/asset_column_schema_constraints.py
+from dagster import (
+ AssetKey,
+ MaterializeResult,
+ TableColumn,
+ TableColumnConstraints,
+ TableSchema,
+ asset,
+)
+
+
+@asset(
+ deps=[AssetKey("source_bar"), AssetKey("source_baz")],
+ metadata={
+ "dagster/column_schema": TableSchema(
+ columns=[
+ TableColumn(
+ "name",
+ "string",
+ description="The name of the person",
+ ),
+ TableColumn(
+ "age",
+ "int",
+ description="The age of the person",
+ constraints=TableColumnConstraints(nullable=False, other=[">0"]),
+ ),
+ ]
+ )
+ },
+)
+def my_asset(): ...
+```
+
+### For assets loaded from integrations
+
+Column schemas are currently supported in the dbt integration. Refer to the [dbt documentation](/integrations/dbt/reference) for more information.
+
+---
+
+## Attaching row count
+
+### For assets defined in Dagster
+
+
+
+You may attach row count schema metadata to Dagster assets as [materialization metadata](/concepts/metadata-tags/asset-metadata#attaching-materialization-metadata) to provide additional context about the number of rows in a materialized table. Dagster will let you track changes in the row count over time, and you can use this information to monitor data quality.
+
+To attach schema metadata to an asset, you will need to attach a numerical value to the `dagster/row_count` key in the metadata parameter of the object returned by the asset function.
+
+Below is an example of how to attach row count metadata to an asset:
+
+```python file=/concepts/metadata-tags/asset_row_count.py
+import pandas as pd
+
+from dagster import AssetKey, MaterializeResult, asset
+
+
+@asset(deps=[AssetKey("source_bar"), AssetKey("source_baz")])
+def my_asset():
+ my_df: pd.DataFrame = ...
+
+ yield MaterializeResult(metadata={"dagster/row_count": 374})
+```
+
+---
+
+## Attaching column-level lineage
+
+Column lineage enables data and analytics engineers alike to understand how a column is created and used in your data platform. Refer to the [Column-level lineage documentation](/concepts/metadata-tags/asset-metadata/column-level-lineage) for more information.
+
+---
+
+## APIs in this guide
+
+| Name | Description |
+| -------------------------------------------- | ---------------------------------------------------------------- |
+| | A decorator used to define assets. |
+| | An object representing a successful materialization of an asset. |
+| | An object representing the schema of a tabular asset. |
+| | Class that defines column information for a tabular asset. |
+| | Class that defines constraints for a column in a tabular asset. |
+
+---
+
+## Related
+
+
+
+
+
+
+
diff --git a/docs/next/public/images/concepts/metadata-tags/metadata-row-count.png b/docs/next/public/images/concepts/metadata-tags/metadata-row-count.png
new file mode 100644
index 0000000000000..e79fd08420742
Binary files /dev/null and b/docs/next/public/images/concepts/metadata-tags/metadata-row-count.png differ
diff --git a/docs/next/public/images/concepts/metadata-tags/metadata-table-schema.png b/docs/next/public/images/concepts/metadata-tags/metadata-table-schema.png
new file mode 100644
index 0000000000000..d799be20dde31
Binary files /dev/null and b/docs/next/public/images/concepts/metadata-tags/metadata-table-schema.png differ
diff --git a/docs/next/public/objects.inv b/docs/next/public/objects.inv
index 12cc04710fe3b..f15f1638ed48b 100644
Binary files a/docs/next/public/objects.inv and b/docs/next/public/objects.inv differ
diff --git a/examples/docs_snippets/docs_snippets/concepts/metadata-tags/asset_column_schema.py b/examples/docs_snippets/docs_snippets/concepts/metadata-tags/asset_column_schema.py
new file mode 100644
index 0000000000000..409a73c629091
--- /dev/null
+++ b/examples/docs_snippets/docs_snippets/concepts/metadata-tags/asset_column_schema.py
@@ -0,0 +1,40 @@
+from dagster import AssetKey, MaterializeResult, TableColumn, TableSchema, asset
+
+
+# Here, we know the schema of the asset, so we can attach it to the asset decorator
+@asset(
+ deps=[AssetKey("source_bar"), AssetKey("source_baz")],
+ metadata={
+ "dagster/column_schema": TableSchema(
+ columns=[
+ TableColumn(
+ "name",
+ "string",
+ description="The name of the person",
+ ),
+ TableColumn(
+ "age",
+ "int",
+ description="The age of the person",
+ ),
+ ]
+ )
+ },
+)
+def my_asset(): ...
+
+
+# Here, the schema isn't known until runtime
+@asset(deps=[AssetKey("source_bar"), AssetKey("source_baz")])
+def my_other_asset():
+ column_names = ...
+ column_types = ...
+
+ columns = [
+ TableColumn(name, column_type)
+ for name, column_type in zip(column_names, column_types)
+ ]
+
+ yield MaterializeResult(
+ metadata={"dagster/column_schema": TableSchema(columns=columns)}
+ )
diff --git a/examples/docs_snippets/docs_snippets/concepts/metadata-tags/asset_column_schema_constraints.py b/examples/docs_snippets/docs_snippets/concepts/metadata-tags/asset_column_schema_constraints.py
new file mode 100644
index 0000000000000..49dddd44e7a95
--- /dev/null
+++ b/examples/docs_snippets/docs_snippets/concepts/metadata-tags/asset_column_schema_constraints.py
@@ -0,0 +1,31 @@
+from dagster import (
+ AssetKey,
+ MaterializeResult,
+ TableColumn,
+ TableColumnConstraints,
+ TableSchema,
+ asset,
+)
+
+
+@asset(
+ deps=[AssetKey("source_bar"), AssetKey("source_baz")],
+ metadata={
+ "dagster/column_schema": TableSchema(
+ columns=[
+ TableColumn(
+ "name",
+ "string",
+ description="The name of the person",
+ ),
+ TableColumn(
+ "age",
+ "int",
+ description="The age of the person",
+ constraints=TableColumnConstraints(nullable=False, other=[">0"]),
+ ),
+ ]
+ )
+ },
+)
+def my_asset(): ...
diff --git a/examples/docs_snippets/docs_snippets/concepts/metadata-tags/asset_row_count.py b/examples/docs_snippets/docs_snippets/concepts/metadata-tags/asset_row_count.py
new file mode 100644
index 0000000000000..40d50a5e768d2
--- /dev/null
+++ b/examples/docs_snippets/docs_snippets/concepts/metadata-tags/asset_row_count.py
@@ -0,0 +1,10 @@
+import pandas as pd
+
+from dagster import AssetKey, MaterializeResult, asset
+
+
+@asset(deps=[AssetKey("source_bar"), AssetKey("source_baz")])
+def my_asset():
+ my_df: pd.DataFrame = ...
+
+ yield MaterializeResult(metadata={"dagster/row_count": 374})
diff --git a/python_modules/dagster-test/dagster_test/toys/table_metadata.py b/python_modules/dagster-test/dagster_test/toys/table_metadata.py
index 57a6264bc949d..2aba3de1c07a0 100644
--- a/python_modules/dagster-test/dagster_test/toys/table_metadata.py
+++ b/python_modules/dagster-test/dagster_test/toys/table_metadata.py
@@ -40,6 +40,29 @@
)
-@asset(metadata={"resident_info": table_metadata})
+@asset(
+ metadata={
+ "dagster/column_schema": TableSchema(
+ columns=[
+ TableColumn("name", "string", description="The name of the person"),
+ TableColumn(
+ "age",
+ "int",
+ description="The age of the person",
+ ),
+ TableColumn(
+ "height",
+ "float",
+ description="The height of the person in centimeters",
+ ),
+ TableColumn(
+ "is_resident",
+ "bool",
+ description="Whether the person is a resident of the city",
+ ),
+ ]
+ ),
+ }
+)
def alpha():
return 1