Skip to content

Commit 8477d0b

Browse files
committed
writing more files to package data; now rebuilding v1 dataset
1 parent 2b97756 commit 8477d0b

3 files changed

Lines changed: 50 additions & 17 deletions

File tree

src/global/general.R

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -44,7 +44,7 @@ ws_areas <- site_data %>%
4444
select(site_code, ws_area_ha)
4545

4646
boundaries <- boundaries %>%
47-
select(-area) %>%
47+
select(-any_of('area')) %>%
4848
left_join(ws_areas) %>%
4949
rename(area = ws_area_ha)
5050

src/global/global_helpers.R

Lines changed: 42 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -10184,6 +10184,9 @@ make_figshare_docs_skeleton <- function(where){
1018410184

1018510185
prepare_site_metadata_for_figshare <- function(outfile){
1018610186

10187+
#writes to figshare directory, where it then gets moved to edi directory,
10188+
#but also writes the site_data file for the ms package
10189+
1018710190
figd <- select(site_data,
1018810191
network, pretty_network, domain, pretty_domain, site_code,
1018910192
epsg_code = CRS,
@@ -10212,6 +10215,9 @@ prepare_site_metadata_for_figshare <- function(outfile){
1021210215
last_record_utc = LastRecordUTC,
1021310216
timezone_olson)
1021410217

10218+
ms_site_data <- figd
10219+
save(ms_site_data, file = '../r_package/data/ms_site_data.RData')
10220+
1021510221
write_csv(figd, outfile)
1021610222
}
1021710223

@@ -10226,6 +10232,8 @@ prepare_variable_metadata_for_figshare <- function(outfile, fs_format){
1022610232
# in old-mode, just one variable metadata file is written. in new format, it's split into
1022710233
# timeseries and ws attrs. In new format, range check limits are written too, as a third file.
1022810234

10235+
#also writes RData file for ms package
10236+
1022910237
if(fs_format == 'new'){
1023010238

1023110239
outfile_ts <- file.path(dirname(outfile),
@@ -10240,7 +10248,7 @@ prepare_variable_metadata_for_figshare <- function(outfile, fs_format){
1024010248
'05_timeseries_documentation',
1024110249
'05e_range_check_limits.csv')
1024210250

10243-
read_csv('../portal/data/general/catalog_files/all_variables.csv',
10251+
ms_vars_ts <- read_csv('../portal/data/general/catalog_files/all_variables.csv',
1024410252
col_types = cols()) %>%
1024510253
select(variable_code = VariableCode,
1024610254
variable_name = VariableName,
@@ -10252,13 +10260,17 @@ prepare_variable_metadata_for_figshare <- function(outfile, fs_format){
1025210260
# mean_obs_per_site = MeanObsPerSite,
1025310261
first_record_utc = FirstRecordUTC,
1025410262
last_record_utc = LastRecordUTC) %>%
10255-
filter(! grepl('_flux$', chem_category)) %>%#TEMP: removing flux metadata
10256-
write_csv(outfile_ts)
10263+
filter(! grepl('_flux$', chem_category)) #TEMP: removing flux metadata
1025710264

10258-
ms_vars %>%
10265+
write_csv(ms_vars_ts, outfile_ts)
10266+
save(ms_vars_ts, file = '../r_package/data/ms_vars_ts.RData')
10267+
10268+
ms_vars_ws <- ms_vars %>%
1025910269
filter(variable_type == 'ws_char') %>%
10260-
select(variable_code, variable_name, unit) %>%
10261-
write_csv(outfile_ws)
10270+
select(variable_code, variable_name, unit)
10271+
10272+
write_csv(ms_vars_ws, outfile_ws)
10273+
save(ms_vars_ws, file = '../r_package/data/ms_vars_ws_attr.RData')
1026210274

1026310275
ms_vars %>%
1026410276
filter(variable_type != 'ws_char') %>%
@@ -10352,7 +10364,17 @@ assemble_misc_docs_figshare <- function(where){
1035210364
attrib_ts_data <- postprocess_attribution_ts()
1035310365
write_csv(attrib_ts_data, file.path(docs_dir, '01b_attribution_and_intellectual_rights_complete.csv'))
1035410366

10355-
#this dataset is required for macrosheds package functioning
10367+
attrib_ws_data <- googlesheets4::read_sheet(
10368+
conf$univ_prods_gsheet,
10369+
na = c('', 'NA'),
10370+
col_types = 'c'
10371+
) %>%
10372+
select(prodname, primary_source = data_source, retrieved_from_GEE = type,
10373+
doi, license, citation, url, addtl_info = notes) %>%
10374+
mutate(retrieved_from_GEE = ifelse(retrieved_from_GEE == 'gee', TRUE, FALSE))
10375+
10376+
#these datasets required for macrosheds package functioning
10377+
save(attrib_ws_data, file = '../r_package/data/attribution_and_intellectual_rights_ws_attr.RData')
1035610378
save(attrib_ts_data, file = '../r_package/data/attribution_and_intellectual_rights_timeseries.RData')
1035710379

1035810380
select(domain_detection_limits, -precision, -sigfigs, -added_programmatically) %>%
@@ -14102,7 +14124,7 @@ generate_watershed_summaries <- function(){
1410214124
var == 'va_npp_median') %>%
1410314125
group_by(site_code) %>%
1410414126
summarize(va_mean_annual_npp = mean(val, na.arm = TRUE)) %>%
14105-
filter(!is.na(va_mean_annual_npp))
14127+
filter(! is.na(va_mean_annual_npp))
1410614128

1410714129
# terrain
1410814130
terrain_fils <- fils[grepl('/terrain', fils)]
@@ -14169,20 +14191,20 @@ generate_watershed_summaries <- function(){
1416914191
!is.na(val)) %>%
1417014192
select(-year) %>%
1417114193
group_by(site_code) %>%
14172-
ungroup() %>%
1417314194
summarize(ck_mean_annual_et = mean(val, na.rm = TRUE)) %>%
14174-
filter( ! is.na(ck_mean_annual_et))
14195+
ungroup() %>%
14196+
filter(! is.na(ck_mean_annual_et))
1417514197

1417614198
# geological chem
1417714199
geochem_fils <- fils[grepl('/geochemical', fils)]
1417814200

1417914201
geochem <- map_dfr(geochem_fils, read_feather) %>%
1418014202
filter(grepl('mean$', var),
14181-
!is.na(val)) %>%
14203+
! is.na(val)) %>%
1418214204
select(-year) %>%
1418314205
group_by(site_code, var) %>%
14184-
ungroup() %>%
1418514206
summarize(mean_val = mean(val, na.rm = TRUE)) %>%
14207+
ungroup() %>%
1418614208
pivot_wider(names_from = 'var', values_from = 'mean_val')
1418714209

1418814210
# fpar
@@ -14193,8 +14215,9 @@ generate_watershed_summaries <- function(){
1419314215
! is.na(val)) %>%
1419414216
select(-year) %>%
1419514217
group_by(site_code) %>%
14218+
summarize(vb_mean_annual_fpar = mean(val)) %>%
1419614219
ungroup() %>%
14197-
summarise(vb_mean_annual_fpar = mean(val))
14220+
filter(! is.na(vb_mean_annual_fpar))
1419814221

1419914222
# lai
1420014223
ff <- fils[grepl('/lai', fils) & grepl('/sum_', fils)]
@@ -14204,8 +14227,9 @@ generate_watershed_summaries <- function(){
1420414227
! is.na(val)) %>%
1420514228
select(-year) %>%
1420614229
group_by(site_code) %>%
14230+
summarize(vb_mean_annual_lai = mean(val)) %>%
1420714231
ungroup() %>%
14208-
summarise(vb_mean_annual_lai = mean(val))
14232+
filter(! is.na(vb_mean_annual_lai))
1420914233

1421014234
# tcw (tesselated cap wetness)
1421114235
ff <- fils[grepl('/tcw', fils) & grepl('/sum_', fils)]
@@ -14215,8 +14239,9 @@ generate_watershed_summaries <- function(){
1421514239
! is.na(val)) %>%
1421614240
select(-year) %>%
1421714241
group_by(site_code) %>%
14242+
summarize(vj_mean_annual_tcw = mean(val)) %>%
1421814243
ungroup() %>%
14219-
summarise(vj_mean_annual_tcw = mean(val))
14244+
filter(! is.na(vj_mean_annual_tcw))
1422014245

1422114246
# ndvi
1422214247
ff <- fils[grepl('/ndvi', fils) & grepl('/sum_', fils)]
@@ -14226,8 +14251,9 @@ generate_watershed_summaries <- function(){
1422614251
! is.na(val)) %>%
1422714252
select(-year) %>%
1422814253
group_by(site_code) %>%
14254+
summarize(vb_mean_annual_ndvi = mean(val)) %>%
1422914255
ungroup() %>%
14230-
summarize(vb_mean_annual_ndvi = mean(val))
14256+
filter(! is.na(vb_mean_annual_ndvi))
1423114257

1423214258
# nsidc snow data
1423314259
ff <- fils[grepl('/nsidc', fils) & grepl('/sum_', fils)]

src/global/one-off/build_eml_templates.R

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -405,6 +405,13 @@ for(td in ts_dmns){
405405

406406
# template_categorical_variables(wd, dd)
407407

408+
# include bibtex files with macrosheds R package ####
409+
410+
ts_bib <- readr::read_file('eml/data_links/timeseries_refs.bib')
411+
save(ts_bib, file = '../r_package/data/bibtex_timeseries.RData')
412+
ws_bib <- readr::read_file('eml/data_links/ws_attr_refs.bib')
413+
save(ws_bib, file = '../r_package/data/bibtex_ws_attr.RData')
414+
408415
# write EML** ####
409416

410417
# temporal_coverage <- map(ts_tables, ~range(read_csv(.)$datetime)) %>%

0 commit comments

Comments
 (0)