Skip to content

Commit

Permalink
Merge pull request #208 from bcgov/auth
Browse files Browse the repository at this point in the history
Enable catalogue authorization
  • Loading branch information
ateucher authored Jun 4, 2020
2 parents 9a21050 + 55210b9 commit 99971c6
Show file tree
Hide file tree
Showing 8 changed files with 109 additions and 17 deletions.
4 changes: 3 additions & 1 deletion .github/workflows/cmd-check.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@ jobs:
env:
R_REMOTES_NO_ERRORS_FROM_WARNINGS: true
CRAN: ${{ matrix.config.cran }}
cache-version: v2
cache-version: v3

steps:
- uses: actions/checkout@v2
Expand Down Expand Up @@ -82,6 +82,8 @@ jobs:
run: |
remotes::install_deps(dependencies = TRUE, configure.args = c('sf' = '${{ matrix.config.sf_args }}'))
install.packages("rcmdcheck")
# Install dev rmarkdown (https://github.com/rstudio/rmarkdown/pull/1832) for R < 3.6
if (getRversion() < 3.6) remotes::install_github("rstudio/rmarkdown")
shell: Rscript {0}

- name: Check
Expand Down
4 changes: 2 additions & 2 deletions R/bcdc-web-services.R
Original file line number Diff line number Diff line change
Expand Up @@ -94,7 +94,7 @@ bcdc_query_geodata.character <- function(record, crs = 3005) {
query_list <- compact(query_list)

## GET and parse data to sf object
cli <- bcdc_http_client(url = "https://openmaps.gov.bc.ca/geo/pub/wfs")
cli <- bcdc_wfs_client()

cols_df <- feature_helper(record)

Expand Down Expand Up @@ -134,7 +134,7 @@ bcdc_query_geodata.bcdc_record <- function(record, crs = 3005) {
query_list <- compact(query_list)

## GET and parse data to sf object
cli <- bcdc_http_client(url = "https://openmaps.gov.bc.ca/geo/pub/wfs")
cli <- bcdc_wfs_client()

cols_df <- feature_helper(query_list$typeNames)

Expand Down
10 changes: 4 additions & 6 deletions R/bcdc_search.R
Original file line number Diff line number Diff line change
Expand Up @@ -32,8 +32,7 @@ bcdc_search_facets <- function(facet = c("license_id", "download_audience",
query <- paste0("\"", facet, "\"", collapse = ",")
query <- paste0("[", query, "]")

cli <- bcdc_http_client(paste0(base_url(),
"action/package_search"))
cli <- bcdc_catalogue_client("action/package_search")

r <- cli$get(query = list(facet.field = query, rows = 0))
r$raise_for_status()
Expand Down Expand Up @@ -66,7 +65,7 @@ bcdc_list <- function() {
limit <- 1000
while (l_new_ret) {

cli <- bcdc_http_client(paste0(base_url(), "action/package_list"))
cli <- bcdc_catalogue_client("action/package_list")

r <- cli$get(query = list(offset = offset, limit = limit))
r$raise_for_status()
Expand Down Expand Up @@ -138,7 +137,7 @@ bcdc_search <- function(..., license_id = NULL,

query <- gsub("\\s+", "%20", query)

cli <- bcdc_http_client(paste0(base_url(), "action/package_search"))
cli <- bcdc_catalogue_client("action/package_search")

# Use I(query) to treat query as is, so that things like + and :
# aren't encoded as %2B, %3A etc
Expand Down Expand Up @@ -190,8 +189,7 @@ bcdc_get_record <- function(id) {

id <- slug_from_url(id)

cli <- bcdc_http_client(paste0(base_url(),
"action/package_show"))
cli <- bcdc_catalogue_client("action/package_show")

r <- cli$get(query = list(id = id))

Expand Down
3 changes: 1 addition & 2 deletions R/describe-feature.R
Original file line number Diff line number Diff line change
Expand Up @@ -70,8 +70,7 @@ bcdc_describe_feature.bcdc_record <- function(record){
parse_raw_feature_tbl <- function(query_list){

## GET and parse data to sf object
cli <-
bcdc_http_client(url = "https://openmaps.gov.bc.ca/geo/pub/wfs")
cli <- bcdc_wfs_client()

cc <- cli$post(body = query_list, encode = "form")

Expand Down
35 changes: 29 additions & 6 deletions R/utils.R
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,8 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and limitations under the License.

base_url <- function() "https://catalogue.data.gov.bc.ca/api/3/"
# Base URL of the B.C. Data Catalogue API; endpoint paths are pasted
# directly onto it, so the trailing slash is significant.
catalogue_base_url <- function() {
  "https://catalogue.data.gov.bc.ca/api/3/"
}

# Base URL of the public WFS service (trailing slash included).
wfs_base_url <- function() {
  "https://openmaps.gov.bc.ca/geo/pub/wfs/"
}

bcdata_user_agent <- function(){
"https://github.com/bcgov/bcdata"
Expand Down Expand Up @@ -74,11 +75,33 @@ formats_supported <- function(){
c(bcdc_read_functions()[["format"]], "zip")
}

bcdc_http_client <- function(url = NULL) {
# Build an HTTP client for a catalogue API endpoint.
#
# `endpoint` is pasted onto catalogue_base_url(); with the default NULL the
# client points at the base URL itself. The client is requested with
# auth = TRUE.
bcdc_catalogue_client <- function(endpoint = NULL) {
  bcdc_http_client(
    paste0(catalogue_base_url(), endpoint),
    auth = TRUE
  )
}

# Build an HTTP client for the WFS service.
#
# `endpoint` is pasted onto wfs_base_url(); with the default NULL the client
# points at the base URL itself. The client is requested with auth = FALSE.
bcdc_wfs_client <- function(endpoint = NULL) {
  bcdc_http_client(
    paste0(wfs_base_url(), endpoint),
    auth = FALSE
  )
}

# Create a crul HTTP client for `url`.
#
# url:  address the client is bound to.
# auth: when TRUE, the value returned by bcdc_auth() is supplied as the
#       `Authorization` header; when FALSE no such header is requested.
#
# Returns the object produced by crul::HttpClient$new().
bcdc_http_client <- function(url, auth = FALSE) {
  headers <- list(
    `User-Agent` = bcdata_user_agent(),
    Authorization = if (auth) bcdc_auth() else NULL
  )

  # A single client is built, from the compacted header list.
  # NOTE(review): compact() presumably drops the NULL Authorization entry
  # when auth is FALSE or no key is stored -- confirm against its definition.
  crul::HttpClient$new(
    url = url,
    headers = compact(headers)
  )
}

# Look up the API key stored in the BCDC_KEY environment variable.
#
# Returns NULL when the variable is unset or empty. Otherwise emits a
# message announcing that the stored key is being used and returns the key.
bcdc_auth <- function() {
  api_key <- Sys.getenv("BCDC_KEY")
  if (nzchar(api_key)) {
    message("Authorizing with your stored API key")
    api_key
  } else {
    NULL
  }
}

## Check if there is internet
Expand Down Expand Up @@ -125,7 +148,6 @@ wfs_to_r_col_type <- function(col){
)
}


##from a record
formats_from_record <- function(x, trim = TRUE){

Expand Down Expand Up @@ -197,7 +219,8 @@ read_from_url <- function(resource, ...){
if (!reported_format %in% formats_supported()) {
stop("Reading ", reported_format, " files is not currently supported in bcdata.")
}
cli <- bcdc_http_client(file_url)
auth <- grepl("(catalogue|pub)\\.data\\.gov\\.bc\\.ca", file_url)
cli <- bcdc_http_client(file_url, auth = auth)

## Establish where to download file
tmp <- tempfile(tmpdir = unique_temp_dir(),
Expand Down
28 changes: 28 additions & 0 deletions README.Rmd
Original file line number Diff line number Diff line change
Expand Up @@ -83,6 +83,34 @@ library(bcdata)
- [Exploring Silviculture Data with bcdata](https://bcgov.github.io/bcdata/articles/explore-silviculture-data-using-bcdata.html)
- Using bcdata with [bcmaps](https://github.com/bcgov/bcmaps) (Coming Soon!)

### BCDC Authentication

If you are an authorized editor of the B.C. Data Catalogue you may want to
access records that are not publicly available (e.g., in DRAFT, waiting to be
published). This can be done by authenticating with the catalogue using an API
key.

_**Important Note:**_ *Your API key is like a password and you must take care to
keep it private. Do not share it, and be careful to not include it in any
scripts or accidentally commit it to GitHub.*

You can log in to the catalogue to obtain your API key, then store it as an
environment variable in your [`.Renviron` file](https://rstats.wtf/r-startup.html#renviron).
The environment variable must be called `BCDC_KEY`, set like this:

```
BCDC_KEY=your-api-key
```

This way, the relevant bcdata functions will read that key and use it to
authorize your calls to the catalogue, allowing you to access the additional
records that you would be able to see if you were logged into the catalogue web
interface. Functions that benefit from this are:

- `bcdc_search()`
- `bcdc_list()`
- `bcdc_get_record()`
- `bcdc_get_data()`

### Getting Help or Reporting an Issue

Expand Down
28 changes: 28 additions & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -89,6 +89,34 @@ library(bcdata)
- Using bcdata with [bcmaps](https://github.com/bcgov/bcmaps) (Coming
Soon\!)

### BCDC Authentication

If you are an authorized editor of the B.C. Data Catalogue you may want
to access records that are not publicly available (e.g., in DRAFT,
waiting to be published). This can be done by authenticating with the
catalogue using an API key.

***Important Note:*** *Your API key is like a password and you must take
care to keep it private. Do not share it, and be careful to not include
it in any scripts or accidentally commit it to GitHub.*

You can log in to the catalogue to obtain your API key, then store it as
an environment variable in your [`.Renviron`
file](https://rstats.wtf/r-startup.html#renviron). The environment
variable must be called `BCDC_KEY`, set like this:

BCDC_KEY=your-api-key

This way, the relevant bcdata functions will read that key and use it to
authorize your calls to the catalogue, allowing you to access the
additional records that you would be able to see if you were logged into
the catalogue web interface. Functions that benefit from this are:

- `bcdc_search()`
- `bcdc_list()`
- `bcdc_get_record()`
- `bcdc_get_data()`

### Getting Help or Reporting an Issue

To report bugs/issues/feature requests, please file an
Expand Down
14 changes: 14 additions & 0 deletions tests/testthat/test-get_record.R
Original file line number Diff line number Diff line change
Expand Up @@ -95,4 +95,18 @@ expect_error(bcdc_tidy_resources("WHSE_IMAGERY_AND_BASE_MAPS.GSR_AIRPORTS_SVW"),
"No bcdc_tidy_resources method for a BCGW object name")
})

# Checks that bcdc_get_record() announces use of the stored API key when
# BCDC_KEY is set, and runs silently once the variable is removed.
test_that("bcdc_get_record works with/without authentication", {
  skip_if_net_down()
  skip_on_cran()

  key_val <- Sys.getenv("BCDC_KEY")
  skip_if_not(nzchar(key_val), "BCDC_KEY is not set")
  # Restore the key when the test exits; add = TRUE so any other exit
  # handlers registered in this scope are kept rather than overwritten.
  on.exit(Sys.setenv(BCDC_KEY = key_val), add = TRUE)

  expect_message(
    res <- bcdc_get_record("76b1b7a3-2112-4444-857a-afccf7b20da8"),
    "Authorizing with your stored API key"
  )
  expect_s3_class(res, "bcdc_record")

  # With the key removed no authorization message should be emitted.
  Sys.unsetenv("BCDC_KEY")
  expect_silent(bcdc_get_record("76b1b7a3-2112-4444-857a-afccf7b20da8"))
})

0 comments on commit 99971c6

Please sign in to comment.