pola-rs · sorhawell · Oct 20, 2023 · Oct 21, 2023 · Oct 23, 2023 · Oct 23, 2023
diff --git a/R/parquet.R b/R/parquet.R
@@ -14,7 +14,23 @@
 #' @name scan_parquet
 #' @rdname IO_scan_parquet
 #' @examples
-#' # TODO write parquet example
+#' # write example file
+#' my_parquet = tempfile(fileext = ".parquet")
+#' pl$LazyFrame(mtcars)$sink_parquet(my_parquet)
+#'
+#' # scan and get (project) only one column "cyl" but filter (apply predicate) on "hp".
+#' lf = pl$scan_parquet(my_parquet)$
+#'   filter(pl$col("hp") > 250)$
+#'   select(pl$col("cyl") * 2)
+#'
+#' # LazyFrame with a logical plan (query)
+#' print(lf)
+#'
+#' # see optimized plan
+#' lf$describe_optimized_plan()
+#'
+#' # Execute and get result DataFrame
+#' lf$collect()
 pl$scan_parquet = function(
     file, # : str | Path,
     n_rows = NULL, # : int | None = None,
@@ -64,6 +80,13 @@ pl$scan_parquet = function(
 #' @param low_memory bool, try reduce memory footprint
 #' @return DataFrame
 #' @name read_parquet
+#' @examples
+#' # read parquet directly to DataFrame
+#' my_parquet = tempfile(fileext = ".parquet")
+#' pl$LazyFrame(mtcars)$sink_parquet(my_parquet)
+#' df = pl$read_parquet(my_parquet)
+#'
+#' print(df)
 pl$read_parquet = function(
     file,
     n_rows = NULL,
@@ -73,9 +96,26 @@ pl$read_parquet = function(
     row_count_name = NULL,
     row_count_offset = 0L,
     low_memory = FALSE) {
+
+  # construct a derived call: same arguments as this call, but targeting pl$scan_parquet
   mc = match.call()
   mc[[1]] = quote(pl$scan_parquet)
-  eval.parent(mc)$collect()
+
+  # eval call, and add to error context
+  mod_err_ctx = \(res) result(res) |> unwrap("in pl$read_parquet():")
+  lf = eval.parent(mc) |> mod_err_ctx()
+  lf$collect() |> mod_err_ctx()
+
+  # alternative style #1
+  # lf = pl$scan_parquet(...) |> mod_err_ctx()
+  # lf$collect() |> mod_err_ctx()
+
+  # alternative style #2
+  # pl$scan_parquet(...) |>
+  #  result() |>
+  #  and_then(\(lf) lf$collect()) |>
+  #  unwrap("in pl$read_parquet():")
+
 }
 
 

diff --git a/man/IO_read_parquet.Rd b/man/IO_read_parquet.Rd
diff --git a/man/IO_scan_parquet.Rd b/man/IO_scan_parquet.Rd
diff --git a/tests/testthat/test-parquet.R b/tests/testthat/test-parquet.R
@@ -0,0 +1,20 @@
+
+
+test_that("read_parquet", {
+  # throws an RPolarsErr that attributes the failure to pl$read_parquet():
+  res = result(pl$read_parquet(42)) # should fail: a real (double) is not allowed as path
+  expect_true(is_err(res))
+  err = res$err
+  expect_true(inherits(err,"RPolarsErr"))
+  expect_identical(res$err$get_rinfo(), "in pl$read_parquet():")
+})
+
+
+
+# # TODO! add unit tests for scan_parquet when function is refactored
+# test_that("scan_parquet", {
+#
+#
+#
+#
+# })