(arrow-adbc) branch main updated: docs(r): Update READMEs for R packages (#1707)

lidavidm Wed, 03 Apr 2024 13:27:03 -0700

This is an automated email from the ASF dual-hosted git repository.

lidavidm pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/arrow-adbc.git



The following commit(s) were added to refs/heads/main by this push:
     new aa1990bb1 docs(r): Update READMEs for R packages (#1707)
aa1990bb1 is described below

commit aa1990bb155f053b8ed4e20b49b04421a0c8a205
Author: Dewey Dunnington <[email protected]>
AuthorDate: Wed Apr 3 17:26:53 2024 -0300

    docs(r): Update READMEs for R packages (#1707)
    
    Just a pass through all the READMEs to generally align them with how
    people are most likely to interact with them at first glance!
---
 r/adbcdrivermanager/README.Rmd | 29 +++++++++--------------------
 r/adbcdrivermanager/README.md  | 38 ++++++++++++++------------------------
 r/adbcpostgresql/README.Rmd    | 10 +++-------
 r/adbcpostgresql/README.md     | 18 +++++++-----------
 r/adbcsqlite/README.Rmd        | 22 +++++++++-------------
 r/adbcsqlite/README.md         | 28 ++++++++++++----------------
 6 files changed, 54 insertions(+), 91 deletions(-)

diff --git a/r/adbcdrivermanager/README.Rmd b/r/adbcdrivermanager/README.Rmd
index 439268cb8..4384c8b4a 100644
--- a/r/adbcdrivermanager/README.Rmd
+++ b/r/adbcdrivermanager/README.Rmd
@@ -70,33 +70,22 @@ library(adbcdrivermanager)
 
 # Get a reference to a database using a driver. The adbcdrivermanager package
 # contains a few drivers useful for illustration and testing.
-db <- adbc_database_init(adbc_driver_monkey())
+db <- adbc_database_init(adbcsqlite::adbcsqlite())
 
 # Open a new connection to a database
 con <- adbc_connection_init(db)
 
-# Initialize a new statement from a connection
-stmt <- adbc_statement_init(con)
+# Write a table
+nycflights13::flights |> write_adbc(con, "flights")
 
-# The monkey driver allows you to specify the data for a query
-# in advance for testing purposes
-adbc_statement_bind_stream(stmt, nycflights13::flights)
-
-# Set the query
-adbc_statement_set_sql_query(stmt, "SELECT * FROM flights")
-
-# Start executing the query. Results in ADBC are ArrowArrayStream objects,
-# which can be materialized using as.data.frame(), as_tibble(),
-# or converted to an arrow::RecordBatchReader using
-# arrow::as_record_batch_reader()
-stream <- nanoarrow::nanoarrow_allocate_array_stream()
-adbc_statement_execute_query(stmt, stream)
-
-# Materialize the whole query as a tibble
-tibble::as_tibble(stream)
+# Issue a query
+con |>
+  read_adbc("SELECT * from flights") |>
+  tibble::as_tibble()
 
 # Clean up!
-adbc_statement_release(stmt)
 adbc_connection_release(con)
 adbc_database_release(db)
 ```
+
+One can also interact with the driver manager at a lower level using `adbc_connection_*()` and `adbc_statement_*()` functions (see reference documentation for details).
diff --git a/r/adbcdrivermanager/README.md b/r/adbcdrivermanager/README.md
index 231fc8a48..387f64c2f 100644
--- a/r/adbcdrivermanager/README.md
+++ b/r/adbcdrivermanager/README.md
@@ -62,34 +62,21 @@ library(adbcdrivermanager)
 
 # Get a reference to a database using a driver. The adbcdrivermanager package
 # contains a few drivers useful for illustration and testing.
-db <- adbc_database_init(adbc_driver_monkey())
+db <- adbc_database_init(adbcsqlite::adbcsqlite())
 
 # Open a new connection to a database
 con <- adbc_connection_init(db)
 
-# Initialize a new statement from a connection
-stmt <- adbc_statement_init(con)
+# Write a table
+nycflights13::flights |> write_adbc(con, "flights")
 
-# The monkey driver allows you to specify the data for a query
-# in advance for testing purposes
-adbc_statement_bind_stream(stmt, nycflights13::flights)
-
-# Set the query
-adbc_statement_set_sql_query(stmt, "SELECT * FROM flights")
-
-# Start executing the query. Results in ADBC are ArrowArrayStream objects,
-# which can be materialized using as.data.frame(), as_tibble(),
-# or converted to an arrow::RecordBatchReader using
-# arrow::as_record_batch_reader()
-stream <- nanoarrow::nanoarrow_allocate_array_stream()
-adbc_statement_execute_query(stmt, stream)
-#> [1] -1
-
-# Materialize the whole query as a tibble
-tibble::as_tibble(stream)
+# Issue a query
+con |>
+  read_adbc("SELECT * from flights") |>
+  tibble::as_tibble()
 #> # A tibble: 336,776 × 19
 #>     year month   day dep_time sched_dep_time dep_delay arr_time sched_arr_time
-#>    <int> <int> <int>    <int>          <int>     <dbl>    <int>          <int>
+#>    <dbl> <dbl> <dbl>    <dbl>          <dbl>     <dbl>    <dbl>          <dbl>
 #>  1  2013     1     1      517            515         2      830            819
 #>  2  2013     1     1      533            529         4      850            830
 #>  3  2013     1     1      542            540         2      923            850
@@ -101,12 +88,15 @@ tibble::as_tibble(stream)
 #>  9  2013     1     1      557            600        -3      838            846
 #> 10  2013     1     1      558            600        -2      753            745
 #> # ℹ 336,766 more rows
-#> # ℹ 11 more variables: arr_delay <dbl>, carrier <chr>, flight <int>,
+#> # ℹ 11 more variables: arr_delay <dbl>, carrier <chr>, flight <dbl>,
 #> #   tailnum <chr>, origin <chr>, dest <chr>, air_time <dbl>, distance <dbl>,
-#> #   hour <dbl>, minute <dbl>, time_hour <dttm>
+#> #   hour <dbl>, minute <dbl>, time_hour <chr>
 
 # Clean up!
-adbc_statement_release(stmt)
 adbc_connection_release(con)
 adbc_database_release(db)
 ```
+
+One can also interact with the driver manager at a lower level using
+`adbc_connection_*()` and `adbc_statement_*()` functions (see reference
+documentation for details).
diff --git a/r/adbcpostgresql/README.Rmd b/r/adbcpostgresql/README.Rmd
index cc68887b2..b94915c16 100644
--- a/r/adbcpostgresql/README.Rmd
+++ b/r/adbcpostgresql/README.Rmd
@@ -73,20 +73,16 @@ db <- adbc_database_init(adbcpostgresql::adbcpostgresql(), uri = uri)
 con <- adbc_connection_init(db)
 
 # Write a table
-flights <- head(nycflights13::flights, 100)
-# (timestamp not supported yet)
-flights$time_hour <- NULL
-flights |>
-  write_adbc(con, "flights")
+nycflights13::flights |> write_adbc(con, "flights")
 
-# Query it
+# Issue a query
 con |>
   read_adbc("SELECT * from flights") |>
   tibble::as_tibble()
 ```
 
 ```{r example-clean-up}
-# Clean up
+# Clean up!
 con |>
   execute_adbc("DROP TABLE flights")
 adbc_connection_release(con)
diff --git a/r/adbcpostgresql/README.md b/r/adbcpostgresql/README.md
index b902cc8c1..96112aada 100644
--- a/r/adbcpostgresql/README.md
+++ b/r/adbcpostgresql/README.md
@@ -64,17 +64,13 @@ db <- adbc_database_init(adbcpostgresql::adbcpostgresql(), uri = uri)
 con <- adbc_connection_init(db)
 
 # Write a table
-flights <- head(nycflights13::flights, 100)
-# (timestamp not supported yet)
-flights$time_hour <- NULL
-flights |>
-  write_adbc(con, "flights")
+nycflights13::flights |> write_adbc(con, "flights")
 
-# Query it
+# Issue a query
 con |>
   read_adbc("SELECT * from flights") |>
   tibble::as_tibble()
-#> # A tibble: 100 × 18
+#> # A tibble: 336,776 × 19
 #>     year month   day dep_time sched_dep_time dep_delay arr_time sched_arr_time
 #>    <int> <int> <int>    <int>          <int>     <dbl>    <int>          <int>
 #>  1  2013     1     1      517            515         2      830            819
@@ -87,14 +83,14 @@ con |>
 #>  8  2013     1     1      557            600        -3      709            723
 #>  9  2013     1     1      557            600        -3      838            846
 #> 10  2013     1     1      558            600        -2      753            745
-#> # ℹ 90 more rows
-#> # ℹ 10 more variables: arr_delay <dbl>, carrier <chr>, flight <int>,
+#> # ℹ 336,766 more rows
+#> # ℹ 11 more variables: arr_delay <dbl>, carrier <chr>, flight <int>,
 #> #   tailnum <chr>, origin <chr>, dest <chr>, air_time <dbl>, distance <dbl>,
-#> #   hour <dbl>, minute <dbl>
+#> #   hour <dbl>, minute <dbl>, time_hour <dttm>
 ```
 
 ``` r
-# Clean up
+# Clean up!
 con |>
   execute_adbc("DROP TABLE flights")
 adbc_connection_release(con)
diff --git a/r/adbcsqlite/README.Rmd b/r/adbcsqlite/README.Rmd
index ffcaee358..950e97e46 100644
--- a/r/adbcsqlite/README.Rmd
+++ b/r/adbcsqlite/README.Rmd
@@ -67,27 +67,23 @@ This is a basic example which shows you how to solve a common problem:
 ```{r example}
 library(adbcdrivermanager)
 
-# Use the driver manager to connect to a database
-db <- adbc_database_init(adbcsqlite::adbcsqlite(), uri = ":memory:")
+# Open a new connection to a database
+db <- adbc_database_init(
+  adbcsqlite::adbcsqlite(),
+  uri = ":memory:"
+)
+
 con <- adbc_connection_init(db)
 
 # Write a table
-flights <- nycflights13::flights
-# (timestamp not supported yet)
-flights$time_hour <- NULL
-flights |>
-  write_adbc(con, "flights")
+nycflights13::flights |> write_adbc(con, "flights")
 
-# Query it
+# Issue a query
 con |>
   read_adbc("SELECT * from flights") |>
   tibble::as_tibble()
-```
 
-```{r}
-# Clean up
-con |>
-  execute_adbc("DROP TABLE flights")
+# Clean up!
 adbc_connection_release(con)
 adbc_database_release(db)
 ```
diff --git a/r/adbcsqlite/README.md b/r/adbcsqlite/README.md
index f04f07cbe..9fc8e5d24 100644
--- a/r/adbcsqlite/README.md
+++ b/r/adbcsqlite/README.md
@@ -58,22 +58,22 @@ This is a basic example which shows you how to solve a common problem:
 ``` r
 library(adbcdrivermanager)
 
-# Use the driver manager to connect to a database
-db <- adbc_database_init(adbcsqlite::adbcsqlite(), uri = ":memory:")
+# Open a new connection to a database
+db <- adbc_database_init(
+  adbcsqlite::adbcsqlite(),
+  uri = ":memory:"
+)
+
 con <- adbc_connection_init(db)
 
 # Write a table
-flights <- nycflights13::flights
-# (timestamp not supported yet)
-flights$time_hour <- NULL
-flights |>
-  write_adbc(con, "flights")
+nycflights13::flights |> write_adbc(con, "flights")
 
-# Query it
+# Issue a query
 con |>
   read_adbc("SELECT * from flights") |>
   tibble::as_tibble()
-#> # A tibble: 336,776 × 18
+#> # A tibble: 336,776 × 19
 #>     year month   day dep_time sched_dep_time dep_delay arr_time sched_arr_time
 #>    <dbl> <dbl> <dbl>    <dbl>          <dbl>     <dbl>    <dbl>          <dbl>
 #>  1  2013     1     1      517            515         2      830            819
@@ -87,15 +87,11 @@ con |>
 #>  9  2013     1     1      557            600        -3      838            846
 #> 10  2013     1     1      558            600        -2      753            745
 #> # ℹ 336,766 more rows
-#> # ℹ 10 more variables: arr_delay <dbl>, carrier <chr>, flight <dbl>,
+#> # ℹ 11 more variables: arr_delay <dbl>, carrier <chr>, flight <dbl>,
 #> #   tailnum <chr>, origin <chr>, dest <chr>, air_time <dbl>, distance <dbl>,
-#> #   hour <dbl>, minute <dbl>
-```
+#> #   hour <dbl>, minute <dbl>, time_hour <chr>
 
-``` r
-# Clean up
-con |>
-  execute_adbc("DROP TABLE flights")
+# Clean up!
 adbc_connection_release(con)
 adbc_database_release(db)
 ```

(arrow-adbc) branch main updated: docs(r): Update READMEs for R packages (#1707)

Reply via email to