From e4b6d3cb5c884210a2e299ece3e43c3f3355060d Mon Sep 17 00:00:00 2001 From: zschira Date: Thu, 19 Dec 2024 17:41:55 -0500 Subject: [PATCH] Fix row count asset check for vcerare --- src/pudl/transform/vcerare.py | 16 +++++++++++++--- 1 file changed, 13 insertions(+), 3 deletions(-) diff --git a/src/pudl/transform/vcerare.py b/src/pudl/transform/vcerare.py index 6ee9e6ce8..198677546 100644 --- a/src/pudl/transform/vcerare.py +++ b/src/pudl/transform/vcerare.py @@ -9,6 +9,7 @@ import pyarrow as pa import pyarrow.parquet as pq from dagster import ( + AssetCheckExecutionContext, AssetCheckResult, asset, asset_check, @@ -359,16 +360,25 @@ def _load_duckdb_table(): blocking=True, description="Check that row count matches expected.", ) -def check_rows() -> AssetCheckResult: +def check_rows(context: AssetCheckExecutionContext) -> AssetCheckResult: """Check rows.""" logger.info("Check VCE RARE hourly table is the expected length") + + # Define row counts for fast/full etl + row_counts = { + "etl_full": 136437000, + "etl_fast": 27287400, + } + vce = _load_duckdb_table() # noqa: F841 (length,) = duckdb.query("SELECT COUNT(*) FROM vce").fetchone() - if length != 136437000: + if ( + expecteded_length := row_counts[context.op_execution_context.job_name] + ) != length: return AssetCheckResult( passed=False, description="Table unexpected length", - metadata={"table_length": length, "expected_length": 136437000}, + metadata={"table_length": length, "expected_length": expecteded_length}, ) return AssetCheckResult(passed=True)