From 26bc1cc9958157e17f88d1e314c9c3a7ffa7a294 Mon Sep 17 00:00:00 2001 From: zilto Date: Wed, 17 Apr 2024 16:24:00 -0400 Subject: [PATCH] added pyarrow resultbuilder; updated dlt example --- examples/dlt/dlt_plugin.ipynb | 200 ++++++++++++++++++++++++++------ examples/dlt/requirements.txt | 1 + hamilton/plugins/h_pyarrow.py | 39 +++++++ tests/plugins/test_h_pyarrow.py | 25 ++++ 4 files changed, 232 insertions(+), 33 deletions(-) create mode 100644 hamilton/plugins/h_pyarrow.py create mode 100644 tests/plugins/test_h_pyarrow.py diff --git a/examples/dlt/dlt_plugin.ipynb b/examples/dlt/dlt_plugin.ipynb index 032bff17c..2cc75a0cc 100644 --- a/examples/dlt/dlt_plugin.ipynb +++ b/examples/dlt/dlt_plugin.ipynb @@ -41,15 +41,15 @@ "\n", "\n", - "\n", - "\n", + "\n", + "\n", "%3\n", - "\n", + "\n", "\n", "cluster__legend\n", - "\n", - "Legend\n", + "\n", + "Legend\n", "\n", "\n", "\n", @@ -58,43 +58,50 @@ "table\n", "DataFrame\n", "\n", - "\n", + "\n", "\n", + "polars_table\n", + "\n", + "polars_table\n", + "DataFrame\n", + "\n", + "\n", + "\n", "print_df_head\n", - "\n", - "print_df_head\n", - "DataFrame\n", + "\n", + "print_df_head\n", + "DataFrame\n", "\n", "\n", - "\n", + "\n", "_print_df_head_inputs\n", - "\n", - "external\n", - "DataFrame\n", + "\n", + "external\n", + "DataFrame\n", "\n", "\n", "\n", "_print_df_head_inputs->print_df_head\n", - "\n", - "\n", + "\n", + "\n", "\n", "\n", - "\n", + "\n", "input\n", - "\n", - "input\n", + "\n", + "input\n", "\n", "\n", - "\n", + "\n", "function\n", - "\n", - "function\n", + "\n", + "function\n", "\n", "\n", "\n" ], "text/plain": [ - "" + "" ] }, "execution_count": 2, @@ -105,10 +112,14 @@ "source": [ "%%cell_to_module -m my_module -d\n", "import pandas as pd\n", + "import polars as pl\n", "\n", "def table() -> pd.DataFrame:\n", " return pd.DataFrame([{\"C\": 1}, {\"C\": 2}])\n", "\n", + "def polars_table() -> pl.DataFrame:\n", + " return pl.DataFrame([{\"C\": 1}, {\"C\": 2}])\n", + "\n", "def print_df_head(external: 
pd.DataFrame) -> pd.DataFrame:\n", " print(\"from print_df_head:\\n\", external.head())" ] @@ -161,7 +172,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "{'dlt_metadata': {'pipeline': {'pipeline_name': 'saver_pipe'}, 'metrics': [{'started_at': DateTime(2024, 4, 15, 20, 18, 40, 423767, tzinfo=Timezone('UTC')), 'finished_at': DateTime(2024, 4, 15, 20, 18, 40, 587988, tzinfo=Timezone('UTC')), 'load_id': '1713212320.0496533'}], 'destination_type': 'dlt.destinations.duckdb', 'destination_displayable_credentials': 'duckdb:////home/tjean/projects/dagworks/hamilton/examples/dlt/saver_pipe.duckdb', 'destination_name': 'duckdb', 'environment': None, 'staging_type': None, 'staging_name': None, 'staging_displayable_credentials': None, 'destination_fingerprint': '', 'dataset_name': 'saver_pipe_dataset', 'loads_ids': ['1713212320.0496533'], 'load_packages': [{'load_id': '1713212320.0496533', 'package_path': '/home/tjean/.dlt/pipelines/saver_pipe/load/loaded/1713212320.0496533', 'state': 'loaded', 'completed_at': DateTime(2024, 4, 15, 20, 18, 40, 570607, tzinfo=Timezone('UTC')), 'jobs': [{'state': 'completed_jobs', 'file_path': '/home/tjean/.dlt/pipelines/saver_pipe/load/loaded/1713212320.0496533/completed_jobs/my_table.7352fcd48a.0.parquet', 'file_size': 574, 'created_at': DateTime(2024, 4, 15, 20, 18, 40, 60607, tzinfo=Timezone('UTC')), 'elapsed': 0.5100002288818359, 'failed_message': None, 'table_name': 'my_table', 'file_id': '7352fcd48a', 'retry_count': 0, 'file_format': 'parquet'}], 'schema_hash': 'UE8l1iVz3xnHM+zYpjm8Bqd+3m6rDG++zNubWIUyecg=', 'schema_name': 'saver_pipe', 'tables': []}], 'first_run': False, 'started_at': DateTime(2024, 4, 15, 20, 18, 40, 423767, tzinfo=Timezone('UTC')), 'finished_at': DateTime(2024, 4, 15, 20, 18, 40, 587988, tzinfo=Timezone('UTC'))}}\n" + "{'dlt_metadata': {'pipeline': {'pipeline_name': 'saver_pipe'}, 'metrics': [{'started_at': DateTime(2024, 4, 17, 20, 22, 7, 283298, tzinfo=Timezone('UTC')), 'finished_at': DateTime(2024, 4, 
17, 20, 22, 7, 453053, tzinfo=Timezone('UTC')), 'load_id': '1713385326.9071813'}], 'destination_type': 'dlt.destinations.duckdb', 'destination_displayable_credentials': 'duckdb:////home/tjean/projects/dagworks/hamilton/examples/dlt/saver_pipe.duckdb', 'destination_name': 'duckdb', 'environment': None, 'staging_type': None, 'staging_name': None, 'staging_displayable_credentials': None, 'destination_fingerprint': '', 'dataset_name': 'saver_pipe_dataset', 'loads_ids': ['1713385326.9071813'], 'load_packages': [{'load_id': '1713385326.9071813', 'package_path': '/home/tjean/.dlt/pipelines/saver_pipe/load/loaded/1713385326.9071813', 'state': 'loaded', 'completed_at': DateTime(2024, 4, 17, 20, 22, 7, 435481, tzinfo=Timezone('UTC')), 'jobs': [{'state': 'completed_jobs', 'file_path': '/home/tjean/.dlt/pipelines/saver_pipe/load/loaded/1713385326.9071813/completed_jobs/my_table.777bd2e418.0.parquet', 'file_size': 574, 'created_at': DateTime(2024, 4, 17, 20, 22, 6, 915481, tzinfo=Timezone('UTC')), 'elapsed': 0.5199999809265137, 'failed_message': None, 'table_name': 'my_table', 'file_id': '777bd2e418', 'retry_count': 0, 'file_format': 'parquet'}], 'schema_hash': 'UE8l1iVz3xnHM+zYpjm8Bqd+3m6rDG++zNubWIUyecg=', 'schema_name': 'saver_pipe', 'tables': []}], 'first_run': False, 'started_at': DateTime(2024, 4, 17, 20, 22, 7, 283298, tzinfo=Timezone('UTC')), 'finished_at': DateTime(2024, 4, 17, 20, 22, 7, 453053, tzinfo=Timezone('UTC'))}}\n" ] }, { @@ -227,7 +238,7 @@ "\n" ], "text/plain": [ - "" + "" ] }, "execution_count": 5, @@ -249,6 +260,129 @@ "dr.visualize_materialization(*materializers)" ] }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Alternative dataframe libraries\n", + "By default, dlt only supports Python `Iterable` of records (e.g., JSON objects), pandas (`pd.DataFrame`) and pyarrow (`pyarrow.Table`, `pyarrow.BatchedRecords`). 
To save a polars, dask, vaex, velox, or duckdb object, you would need to convert it to a supported type first.\n", + "\n", + "Hamilton provides adapter to make the process easy! Simply add the adapter to the `combine=` keyword of the data saver." + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "{'dlt_metadata': {'pipeline': {'pipeline_name': 'saver_pipe'}, 'metrics': [{'started_at': DateTime(2024, 4, 17, 20, 22, 24, 280884, tzinfo=Timezone('UTC')), 'finished_at': DateTime(2024, 4, 17, 20, 22, 24, 447750, tzinfo=Timezone('UTC')), 'load_id': '1713385343.9070144'}], 'destination_type': 'dlt.destinations.duckdb', 'destination_displayable_credentials': 'duckdb:////home/tjean/projects/dagworks/hamilton/examples/dlt/saver_pipe.duckdb', 'destination_name': 'duckdb', 'environment': None, 'staging_type': None, 'staging_name': None, 'staging_displayable_credentials': None, 'destination_fingerprint': '', 'dataset_name': 'saver_pipe_dataset', 'loads_ids': ['1713385343.9070144'], 'load_packages': [{'load_id': '1713385343.9070144', 'package_path': '/home/tjean/.dlt/pipelines/saver_pipe/load/loaded/1713385343.9070144', 'state': 'loaded', 'completed_at': DateTime(2024, 4, 17, 20, 22, 24, 425481, tzinfo=Timezone('UTC')), 'jobs': [{'state': 'completed_jobs', 'file_path': '/home/tjean/.dlt/pipelines/saver_pipe/load/loaded/1713385343.9070144/completed_jobs/my_polars_table.a4e2d05d46.0.parquet', 'file_size': 574, 'created_at': DateTime(2024, 4, 17, 20, 22, 23, 915481, tzinfo=Timezone('UTC')), 'elapsed': 0.5099999904632568, 'failed_message': None, 'table_name': 'my_polars_table', 'file_id': 'a4e2d05d46', 'retry_count': 0, 'file_format': 'parquet'}], 'schema_hash': '4ezuw/Ke94mRLdyi/MbomA4EPL+AciFUjmfshpA07dU=', 'schema_name': 'saver_pipe', 'tables': []}], 'first_run': False, 'started_at': DateTime(2024, 4, 17, 20, 22, 24, 280884, tzinfo=Timezone('UTC')), 'finished_at': 
DateTime(2024, 4, 17, 20, 22, 24, 447750, tzinfo=Timezone('UTC'))}}\n" + ] + }, + { + "data": { + "image/svg+xml": [ + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "%3\n", + "\n", + "\n", + "cluster__legend\n", + "\n", + "Legend\n", + "\n", + "\n", + "\n", + "polars_saver_node_build_result\n", + "\n", + "polars_saver_node_build_result\n", + "Table\n", + "\n", + "\n", + "\n", + "polars_saver_node\n", + "\n", + "\n", + "polars_saver_node\n", + "DltDestinationSaver\n", + "\n", + "\n", + "\n", + "polars_saver_node_build_result->polars_saver_node\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "polars_table\n", + "\n", + "polars_table\n", + "DataFrame\n", + "\n", + "\n", + "\n", + "polars_table->polars_saver_node_build_result\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "function\n", + "\n", + "function\n", + "\n", + "\n", + "\n", + "output\n", + "\n", + "output\n", + "\n", + "\n", + "\n", + "materializer\n", + "\n", + "\n", + "materializer\n", + "\n", + "\n", + "\n" + ], + "text/plain": [ + "" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "from hamilton.plugins import h_pyarrow\n", + "\n", + "materializers = [\n", + " to.dlt(\n", + " id=\"polars_saver_node\",\n", + " dependencies=[\"polars_table\"],\n", + " combine=h_pyarrow.PyarrowTableResult(),\n", + " table_name=\"my_polars_table\",\n", + " pipeline=saver_pipeline,\n", + " )\n", + "]\n", + "results, _ = dr.materialize(*materializers)\n", + "print(results[\"polars_saver_node\"])\n", + "dr.visualize_materialization(*materializers)" + ] + }, { "cell_type": "markdown", "metadata": {}, @@ -261,7 +395,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 8, "metadata": {}, "outputs": [], "source": [ @@ -289,7 +423,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 9, "metadata": {}, "outputs": [ { @@ -297,12 +431,12 @@ "output_type": "stream", "text": [ "from print_df_head:\n", - " col _dlt_load_id _dlt_id\n", 
from typing import Any, Type

import pyarrow
from pyarrow.interchange import from_dataframe

from hamilton.lifecycle.api import ResultBuilder


class PyarrowTableResult(ResultBuilder):
    """Add this result builder to a materializer's `combine` statement to convert your
    dataframe object to a pyarrow representation and make it compatible with pyarrow
    DataSavers.

    It implicitly supports ``input_type == Any``, but it expects dataframe objects
    implementing the dataframe interchange protocol
    (ref: https://arrow.apache.org/docs/python/interchange_protocol.html),
    for example:

    - pandas
    - polars
    - dask
    - vaex
    - ibis
    - duckdb results
    """

    def output_type(self) -> Type:
        """Type produced by :meth:`build_result` — a ``pyarrow.Table``."""
        return pyarrow.Table

    def build_result(self, **outputs: Any) -> Any:
        """Convert a single object implementing the ``__dataframe__`` protocol to
        a pyarrow Table.

        Receiving multiple outputs is not supported because this builder has no
        joining logic.

        ref: https://arrow.apache.org/docs/python/interchange_protocol.html

        :param outputs: mapping of node name to node result; must contain exactly
            one item whose value implements the dataframe interchange protocol.
        :return: the single output converted to a ``pyarrow.Table``.
        :raises AssertionError: if zero or more than one output is received.
        """
        if len(outputs) != 1:
            # NOTE: the original message concatenated two literals with no separator,
            # yielding "...dependencies=[])`It received ..."; fixed with ". " between them.
            raise AssertionError(
                "PyarrowTableResult can only receive 1 output, i.e., only one item "
                f"in `to.SAVER(dependencies=[])`. It received {len(outputs)} outputs."
            )
        return from_dataframe(next(iter(outputs.values())))