@@ -10184,6 +10184,9 @@ make_figshare_docs_skeleton <- function(where){
1018410184
1018510185prepare_site_metadata_for_figshare <- function(outfile){
1018610186
10187+ #writes to figshare directory, where it then gets moved to edi directory,
10188+ #but also writes the site_data file for the ms package
10189+
1018710190 figd <- select(site_data,
1018810191 network, pretty_network, domain, pretty_domain, site_code,
1018910192 epsg_code = CRS,
@@ -10212,6 +10215,9 @@ prepare_site_metadata_for_figshare <- function(outfile){
1021210215 last_record_utc = LastRecordUTC,
1021310216 timezone_olson)
1021410217
10218+ ms_site_data <- figd
10219+ save(ms_site_data, file = '../r_package/data/ms_site_data.RData')
10220+
1021510221 write_csv(figd, outfile)
1021610222}
1021710223
@@ -10226,6 +10232,8 @@ prepare_variable_metadata_for_figshare <- function(outfile, fs_format){
1022610232 # in old-mode, just one variable metadata file is written. in new format, it's split into
1022710233 # timeseries and ws attrs. In new format, range check limits are written too, as a third file.
1022810234
10235+ #also writes RData file for ms package
10236+
1022910237 if(fs_format == 'new'){
1023010238
1023110239 outfile_ts <- file.path(dirname(outfile),
@@ -10240,7 +10248,7 @@ prepare_variable_metadata_for_figshare <- function(outfile, fs_format){
1024010248 '05_timeseries_documentation',
1024110249 '05e_range_check_limits.csv')
1024210250
10243- read_csv('../portal/data/general/catalog_files/all_variables.csv',
10251+ ms_vars_ts <- read_csv('../portal/data/general/catalog_files/all_variables.csv',
1024410252 col_types = cols()) %>%
1024510253 select(variable_code = VariableCode,
1024610254 variable_name = VariableName,
@@ -10252,13 +10260,17 @@ prepare_variable_metadata_for_figshare <- function(outfile, fs_format){
1025210260 # mean_obs_per_site = MeanObsPerSite,
1025310261 first_record_utc = FirstRecordUTC,
1025410262 last_record_utc = LastRecordUTC) %>%
10255- filter(! grepl('_flux$', chem_category)) %>%#TEMP: removing flux metadata
10256- write_csv(outfile_ts)
10263+ filter(! grepl('_flux$', chem_category)) #TEMP: removing flux metadata
1025710264
10258- ms_vars %>%
10265+ write_csv(ms_vars_ts, outfile_ts)
10266+ save(ms_vars_ts, file = '../r_package/data/ms_vars_ts.RData')
10267+
10268+ ms_vars_ws <- ms_vars %>%
1025910269 filter(variable_type == 'ws_char') %>%
10260- select(variable_code, variable_name, unit) %>%
10261- write_csv(outfile_ws)
10270+ select(variable_code, variable_name, unit)
10271+
10272+ write_csv(ms_vars_ws, outfile_ws)
10273+ save(ms_vars_ws, file = '../r_package/data/ms_vars_ws_attr.RData')
1026210274
1026310275 ms_vars %>%
1026410276 filter(variable_type != 'ws_char') %>%
@@ -10352,7 +10364,17 @@ assemble_misc_docs_figshare <- function(where){
1035210364 attrib_ts_data <- postprocess_attribution_ts()
1035310365 write_csv(attrib_ts_data, file.path(docs_dir, '01b_attribution_and_intellectual_rights_complete.csv'))
1035410366
10355- #this dataset is required for macrosheds package functioning
10367+ attrib_ws_data <- googlesheets4::read_sheet(
10368+ conf$univ_prods_gsheet,
10369+ na = c('', 'NA'),
10370+ col_types = 'c'
10371+ ) %>%
10372+ select(prodname, primary_source = data_source, retrieved_from_GEE = type,
10373+ doi, license, citation, url, addtl_info = notes) %>%
10374+ mutate(retrieved_from_GEE = ifelse(retrieved_from_GEE == 'gee', TRUE, FALSE))
10375+
10376+ #these datasets required for macrosheds package functioning
10377+ save(attrib_ws_data, file = '../r_package/data/attribution_and_intellectual_rights_ws_attr.RData')
1035610378 save(attrib_ts_data, file = '../r_package/data/attribution_and_intellectual_rights_timeseries.RData')
1035710379
1035810380 select(domain_detection_limits, -precision, -sigfigs, -added_programmatically) %>%
@@ -14102,7 +14124,7 @@ generate_watershed_summaries <- function(){
1410214124 var == 'va_npp_median') %>%
1410314125 group_by(site_code) %>%
1410414126 summarize(va_mean_annual_npp = mean(val, na.arm = TRUE)) %>%
14105- filter(!is.na(va_mean_annual_npp))
14127+ filter(! is.na(va_mean_annual_npp))
1410614128
1410714129 # terrain
1410814130 terrain_fils <- fils[grepl('/terrain', fils)]
@@ -14169,20 +14191,20 @@ generate_watershed_summaries <- function(){
1416914191 !is.na(val)) %>%
1417014192 select(-year) %>%
1417114193 group_by(site_code) %>%
14172- ungroup() %>%
1417314194 summarize(ck_mean_annual_et = mean(val, na.rm = TRUE)) %>%
14174- filter( ! is.na(ck_mean_annual_et))
14195+ ungroup() %>%
14196+ filter(! is.na(ck_mean_annual_et))
1417514197
1417614198 # geological chem
1417714199 geochem_fils <- fils[grepl('/geochemical', fils)]
1417814200
1417914201 geochem <- map_dfr(geochem_fils, read_feather) %>%
1418014202 filter(grepl('mean$', var),
14181- !is.na(val)) %>%
14203+ ! is.na(val)) %>%
1418214204 select(-year) %>%
1418314205 group_by(site_code, var) %>%
14184- ungroup() %>%
1418514206 summarize(mean_val = mean(val, na.rm = TRUE)) %>%
14207+ ungroup() %>%
1418614208 pivot_wider(names_from = 'var', values_from = 'mean_val')
1418714209
1418814210 # fpar
@@ -14193,8 +14215,9 @@ generate_watershed_summaries <- function(){
1419314215 ! is.na(val)) %>%
1419414216 select(-year) %>%
1419514217 group_by(site_code) %>%
14218+ summarize(vb_mean_annual_fpar = mean(val)) %>%
1419614219 ungroup() %>%
14197- summarise(vb_mean_annual_fpar = mean(val ))
14220+ filter(! is.na(vb_mean_annual_fpar ))
1419814221
1419914222 # lai
1420014223 ff <- fils[grepl('/lai', fils) & grepl('/sum_', fils)]
@@ -14204,8 +14227,9 @@ generate_watershed_summaries <- function(){
1420414227 ! is.na(val)) %>%
1420514228 select(-year) %>%
1420614229 group_by(site_code) %>%
14230+ summarize(vb_mean_annual_lai = mean(val)) %>%
1420714231 ungroup() %>%
14208- summarise(vb_mean_annual_lai = mean(val ))
14232+ filter(! is.na(vb_mean_annual_lai ))
1420914233
1421014234 # tcw (tesselated cap wetness)
1421114235 ff <- fils[grepl('/tcw', fils) & grepl('/sum_', fils)]
@@ -14215,8 +14239,9 @@ generate_watershed_summaries <- function(){
1421514239 ! is.na(val)) %>%
1421614240 select(-year) %>%
1421714241 group_by(site_code) %>%
14242+ summarize(vj_mean_annual_tcw = mean(val)) %>%
1421814243 ungroup() %>%
14219- summarise(vj_mean_annual_tcw = mean(val ))
14244+ filter(! is.na(vj_mean_annual_tcw ))
1422014245
1422114246 # ndvi
1422214247 ff <- fils[grepl('/ndvi', fils) & grepl('/sum_', fils)]
@@ -14226,8 +14251,9 @@ generate_watershed_summaries <- function(){
1422614251 ! is.na(val)) %>%
1422714252 select(-year) %>%
1422814253 group_by(site_code) %>%
14254+ summarize(vb_mean_annual_ndvi = mean(val)) %>%
1422914255 ungroup() %>%
14230- summarize(vb_mean_annual_ndvi = mean(val ))
14256+ filter(! is.na(vb_mean_annual_ndvi ))
1423114257
1423214258 # nsidc snow data
1423314259 ff <- fils[grepl('/nsidc', fils) & grepl('/sum_', fils)]
0 commit comments