-
Notifications
You must be signed in to change notification settings - Fork 19
/
Copy pathOSDquery.R
141 lines (121 loc) · 5.25 KB
/
OSDquery.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
# https://www.postgresql.org/docs/9.5/static/textsearch-controls.html
# these are all parameters expected by the SoilWeb OSD Fulltext search
#' Search full text of Official Series Description on SoilWeb
#'
#' @description This is the R interface to \href{https://casoilresource.lawr.ucdavis.edu/osd-search/}{OSD search by Section} and \href{https://casoilresource.lawr.ucdavis.edu/osd-search/search-entire-osd.php}{OSD Search} APIs provided by SoilWeb.
#'
#' OSD records are searched with the \href{https://www.postgresql.org/docs/9.5/textsearch.html}{PostgreSQL fulltext indexing} and query system (\href{https://www.postgresql.org/docs/9.5/datatype-textsearch.html}{syntax details}). Each search field (except for the "brief narrative" and MLRA) corresponds with a section header in an OSD. The results may not include every OSD due to formatting errors and typos. Results are scored based on the number of times search terms match words in associated sections.
#'
#' @param everything search entire OSD text (default is NULL), `mlra` may also be specified, all other arguments are ignored
#' @param mlra a comma-delimited string of MLRA to search ('17,18,22A')
#' @param taxonomic_class search family level classification
#' @param typical_pedon search typical pedon section
#' @param brief_narrative search brief narrative
#' @param ric search range in characteristics section
#' @param use_and_veg search use and vegetation section
#' @param competing_series search competing series section
#' @param geog_location search geographic setting section
#' @param geog_assoc_soils search geographically associated soils section
#'
#' @details
#' See \href{https://casoilresource.lawr.ucdavis.edu/osd-search/}{this webpage} for more information.
#'
#' - family level taxa are derived from SC database, not parsed OSD records
#'
#' - MLRA are derived via spatial intersection (SSURGO x MLRA polygons)
#'
#' - MLRA-filtering is only possible for series used in the current SSURGO snapshot (component name)
#'
#' - logical AND: &
#'
#' - logical OR: |
#'
#' - wildcard, e.g. rhy-something rhy:*
#'
#' - search terms with spaces need doubled single quotes: ''san joaquin''
#'
#' - combine search terms into a single expression: (grano:* | granite)
#'
#' Related documentation can be found in the following tutorials
#' - [overview of all soil series query functions](http://ncss-tech.github.io/AQP/soilDB/soil-series-query-functions.html)
#' - [competing soil series](https://ncss-tech.github.io/AQP/soilDB/competing-series.html)
#' - [siblings](https://ncss-tech.github.io/AQP/soilDB/siblings.html)
#'
#' @references USDA-NRCS OSD search tools: \url{https://soilseries.sc.egov.usda.gov/}
#'
#' @author D.E. Beaudette
#'
#' @note SoilWeb maintains a snapshot of the Official Series Description data.
#'
#' @seealso \code{\link{fetchOSD}, \link{siblings}, \link{fetchOSD}}
#'
#' @keywords manip
#'
#' @return a \code{data.frame} object containing soil series names that match patterns supplied as arguments.
#' @export
#' @examplesIf curl::has_internet() && require(aqp)
#' @examples
#'
#' \donttest{
#' # find all series that list Pardee as a geographically associated soil.
#' s <- OSDquery(geog_assoc_soils = 'pardee')
#'
#' # get data for these series
#' x <- fetchOSD(s$series, extended = TRUE, colorState = 'dry')
#'
#' # simple figure
#' par(mar=c(0,0,1,1))
#' plot(x$SPC)
#' }
#'
OSDquery <- function(everything = NULL, mlra='', taxonomic_class='', typical_pedon='', brief_narrative='', ric='', use_and_veg='', competing_series='', geog_location='', geog_assoc_soils='') {
# check for required packages
if(!requireNamespace('httr', quietly=TRUE) | !requireNamespace('jsonlite', quietly=TRUE))
stop('please install the `httr` and `jsonlite` packages', call.=FALSE)
# sanity checks
# mode selection
if(is.null(everything)) {
## searching by sections
# build parameters list
parameters=list(
json = 1,
mlra = mlra,
taxonomic_class = taxonomic_class,
typical_pedon = typical_pedon,
brief_narrative = brief_narrative,
ric = ric,
use_and_veg = use_and_veg,
competing_series = competing_series,
geog_location = geog_location,
geog_assoc_soils = geog_assoc_soils
)
# API URL
# note: this is the load-balancer
u <- 'https://casoilresource.lawr.ucdavis.edu/osd-search/index.php'
} else {
## searching entire OSD text
# build parameters list
parameters=list(
json = 1,
query = everything,
mlra = mlra
)
# API URL
# note: this is the load-balancer
u <- 'https://casoilresource.lawr.ucdavis.edu/osd-search/search-entire-osd.php'
}
# submit via POST
res <- httr::POST(u, body = parameters, encode='form')
# TODO: figure out what an error state looks like
# trap errors, likely related to SQL syntax errors
request.status <- try(httr::stop_for_status(res), silent = TRUE)
# the result is JSON
# should simplify to data.frame nicely
r.content <- httr::content(res, as = 'text', encoding = 'UTF-8')
d <- jsonlite::fromJSON(r.content)
# results will either be: data.frame, empty list, or NULL
# ensure result is either data.frame or NULL
if(inherits(d, 'list') & length(d) < 1)
return(NULL)
return(d)
}