pola-rs · ritchie46 · Jun 22, 2024 · Jun 21, 2024 · Jun 21, 2024 · Jun 21, 2024
@@ -129,6 +129,9 @@ fn decompress_impl<R: Read>(
                     },
                 };
             }
+            if line_count == n_rows {
+                out.truncate(buf_pos); // retain only first n_rows in out
+            }
             out
         },
     })

@@ -213,7 +213,13 @@ string_pad = ["polars-lazy?/string_pad", "polars-ops/string_pad"]
 string_reverse = ["polars-lazy?/string_reverse", "polars-ops/string_reverse"]
 string_to_integer = ["polars-lazy?/string_to_integer", "polars-ops/string_to_integer"]
 take_opt_iter = ["polars-core/take_opt_iter"]
-timezones = ["polars-core/timezones", "polars-lazy?/timezones", "polars-io/timezones", "polars-sql?/timezones"]
+timezones = [
+  "polars-core/timezones",
+  "polars-lazy?/timezones",
+  "polars-io/timezones",
+  "polars-ops/timezones",
+  "polars-sql?/timezones",
+]
 to_dummies = ["polars-ops/to_dummies"]
 top_k = ["polars-lazy?/top_k"]
 trigonometry = ["polars-lazy?/trigonometry"]

@@ -2,7 +2,6 @@ use std::io::Cursor;
 use std::num::NonZeroUsize;
 
 use polars::io::RowIndex;
-use polars_core::export::chrono;
 use polars_core::utils::concat_df;
 
 use super::*;
@@ -41,7 +40,10 @@ fn write_csv() {
 }
 
 #[test]
+#[cfg(feature = "timezones")]
 fn write_dates() {
+    use polars_core::export::chrono;
+
     let s0 = Series::new("date", [chrono::NaiveDate::from_yo_opt(2024, 33), None]);
     let s1 = Series::new("time", [None, chrono::NaiveTime::from_hms_opt(19, 50, 0)]);
     let s2 = Series::new(
@@ -1389,3 +1391,16 @@ fn test_read_io_reader() {
     let expected = CsvReader::new(file).finish().unwrap();
     assert!(df.equals(&expected))
 }
+
+#[test] // reads a compressed CSV fixture with an `n_rows` limit and checks the frame shape
+#[cfg(any(feature = "decompress", feature = "decompress-fast"))] // only built with a decompress feature
+fn test_read_compressed() {
+    const COMPRESSED_CSV: &str = "../../examples/datasets/compressed.csv.gz"; // relative path — NOTE(review): presumably resolved from the crate dir; confirm
+    let df = CsvReadOptions::default()
+        .with_n_rows(Some(2367)) // cap the read at 2367 rows
+        .try_into_reader_with_file_path(Some(COMPRESSED_CSV.into()))
+        .unwrap() // panics (fails the test) if the reader cannot be created
+        .finish()
+        .unwrap(); // panics (fails the test) if reading/parsing fails
+    assert_eq!(df.shape(), (2367, 3)); // row count must equal the requested n_rows; 3 columns expected
+}
diff --git a/examples/datasets/compressed.csv.gz b/examples/datasets/compressed.csv.gz
-Original file line number
+Diff line change
@@ Expand Up / @@ -129,6 +129,9 @@ fn decompress_impl<R: Read>( @@
                         },
                     };
                 }
+                if line_count == n_rows {
+                    out.truncate(buf_pos); // retain only first n_rows in out
+                }
                 out
             },
         })
@@ Expand Down @@