delta-io · wjones127 · Dec 1, 2022 · Nov 26, 2022 · Nov 26, 2022 · Nov 27, 2022
@@ -132,8 +132,28 @@ def write_deltalake(
     :param overwrite_schema: If True, allows updating the schema of the table.
     :param storage_options: options passed to the native delta filesystem. Unused if 'filesystem' is defined.
     """
+
     if _has_pandas and isinstance(data, pd.DataFrame):
-        data = pa.Table.from_pandas(data)
+        if schema is not None:
+            data = pa.Table.from_pandas(data, schema=schema)
+        else:
+            _schema = pa.Table.from_pandas(data).schema
+            schema_out = []
+            for _field in _schema:
+                # Delta Lake only supports us timestamps; pandas yields ns, so downcast.
+                # partially handles https://github.com/delta-io/delta-rs/issues/686
+                if pa.types.is_timestamp(_field.type):
+                    f = pa.field(
+                        name=_field.name,
+                        type=pa.timestamp("us"),
+                        nullable=_field.nullable,
+                        metadata=_field.metadata,
+                    )
+                    schema_out.append(f)
+                else:
+                    schema_out.append(_field)
+            schema = pa.schema(schema_out, metadata=_schema.metadata)
+            data = pa.Table.from_pandas(data, schema=schema)
 
     if schema is None:
         if isinstance(data, RecordBatchReader):

@@ -275,9 +275,8 @@ def test_fails_wrong_partitioning(existing_table: DeltaTable, sample_data: pa.Ta
 def test_write_pandas(tmp_path: pathlib.Path, sample_data: pa.Table):
     # When timestamp is converted to Pandas, it gets casted to ns resolution,
     # but Delta Lake schemas only support us resolution.
-    sample_pandas = sample_data.to_pandas().drop(["timestamp"], axis=1)
+    sample_pandas = sample_data.to_pandas()
     write_deltalake(str(tmp_path), sample_pandas)
-
     delta_table = DeltaTable(str(tmp_path))
     df = delta_table.to_pandas()
     assert_frame_equal(df, sample_pandas)