-
Notifications
You must be signed in to change notification settings - Fork 6
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
plug timeline into pipeline #39
Changes from 13 commits
5b534c6
7a870eb
fbfd6e0
7a0daa5
9e8919e
56f26e4
f658ad5
07333f5
9914c06
c9dca03
d166d0d
79cecf1
bf4bb65
d954898
cbc0815
3cf86f1
a6de9c8
fb7550c
3bbb3ce
e379f32
ef861e8
d2056b8
e2750ad
a07ccd9
4a529b5
b951de9
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -3,16 +3,19 @@ add_paths_to_data <- function(data_in) { | |
data_in %>% mutate(path = build_path_peak(daily_quant)) | ||
} | ||
|
||
add_colors_to_data <- function(data_in, scico_palette_nm = "roma") { | ||
add_colors_to_data <- function(data_in, scico_palette_nm = "roma", gw_time) { | ||
# Create 5 color palette | ||
col_palette <- rev(scico::scico(5, palette = scico_palette_nm)) | ||
|
||
data_in %>% | ||
# Add number 1:365 for day of water year for each site | ||
group_by(site_no) %>% | ||
arrange(Date) %>% | ||
mutate(wyday = row_number()) %>% | ||
ungroup() %>% | ||
date_full <- data_in %>% | ||
# create a row for every date x site | ||
mutate(site_no = as.character(site_no)) %>% | ||
expand(Date, site_no) %>% | ||
distinct() | ||
|
||
gw_time %>% | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Adding a comment about what is happening here and why would be very useful! After running the code and exploring, I think that these left joins effectively filter the data so that each site has values for the first day of every month in the data set. |
||
left_join(date_full) %>% | ||
left_join(data_in %>% mutate(site_no = as.character(site_no))) %>% | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Doing the step above to change how this data is read in would simplify this line to |
||
# Add color based on quantile category | ||
mutate(color = ifelse( | ||
quant_category == "Very high", | ||
|
@@ -26,3 +29,28 @@ add_colors_to_data <- function(data_in, scico_palette_nm = "roma") { | |
quant_category == "Very low", | ||
yes = col_palette[5], no = "black")))))) | ||
} | ||
generate_time <- function(data_in) { | ||
date_start <- min(gw_anomaly_data$Date) | ||
cnell-usgs marked this conversation as resolved.
Show resolved
Hide resolved
|
||
date_end <- max(gw_anomaly_data$Date) | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Consider adding |
||
|
||
time_df <- tibble(Date = seq.Date(from = date_start, | ||
to = date_end, | ||
by = "1 day")) %>% | ||
mutate(day_seq = as.numeric(rownames(.))) %>% | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
|
||
arrange(day_seq) | ||
cnell-usgs marked this conversation as resolved.
Show resolved
Hide resolved
|
||
|
||
return(time_df) | ||
|
||
} | ||
generate_months <- function(file_out, data_in){ | ||
data_in %>% | ||
mutate(month = lubridate::month(Date), | ||
month_label = lubridate::month(Date, label = TRUE), | ||
year = lubridate::year(Date)) %>% | ||
group_by(month, month_label, year) %>% | ||
filter(day_seq == min(day_seq)) %>% ## find the first day of each month to draw labels | ||
ungroup() %>% | ||
group_by(year) %>% | ||
mutate(year_label = ifelse(day_seq == min(day_seq), year, NA)) %>% | ||
cnell-usgs marked this conversation as resolved.
Show resolved
Hide resolved
|
||
write_csv(file_out) | ||
} |
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -19,26 +19,19 @@ targets: | |
|
||
3_visualize: | ||
depends: | ||
- 3_visualize/out/anomaly_peaks.svg | ||
- src/assets/anomaly_peaks.svg | ||
- public/gw_sites.csv | ||
- public/date_peaks.csv | ||
- src/assets/anomaly_peaks.svg | ||
- public/gw_sites.csv ## this is in aws as gw-conditions-sites.csv | ||
- public/gw-conditions-wy20.csv ## in aws as gw-conditions-wy20.csv | ||
- public/gw-conditions-daily-count.csv ## in aws as gw-conditions-daily-count.csv | ||
|
||
3_visualize/out/anomaly_peaks.svg: | ||
# exports that are leveraged by vue | ||
src/assets/anomaly_peaks.svg: | ||
command: build_peaks_svg( | ||
target_name, | ||
data_in = gw_anomaly_data_w_colors, | ||
sites_sf = gw_sites_sf, | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. You took out these two arguments but the function itself, still has these included in its definition. |
||
svg_width = svg_width, | ||
svg_height = svg_height) | ||
|
||
src/assets/anomaly_peaks.svg: | ||
command: file.copy( | ||
to = target_name, | ||
from = '3_visualize/out/anomaly_peaks.svg', | ||
overwrite = TRUE) | ||
|
||
public/date_peaks.csv: | ||
public/gw-conditions-wy20.csv: | ||
command: gwl_to_peak( | ||
target_name, | ||
gw_anomaly_data_w_colors) | ||
|
@@ -47,9 +40,10 @@ targets: | |
command: get_site_coords( | ||
target_name, | ||
sites_sf = gw_sites_sf) | ||
public/gwl_daily_count.csv: | ||
|
||
public/gw-conditions-daily-count.csv: | ||
command: site_prop_timeseries(target_name, | ||
gw_anomaly_data_w_colors) | ||
|
||
|
||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -5,33 +5,5 @@ build_peaks_svg <- function(out_file, data_in, sites_sf, svg_width, svg_height) | |
|
||
add_background_map(svg_root, svg_width = svg_width, outline_states = FALSE) | ||
|
||
# Add spark line within group per site | ||
|
||
# TODO: THIS ONLY WORKS FOR A SINGLE DAY RIGHT NOW. I CHOSE OCT 31, 2019 | ||
# TODO: Blanket removing any path with an NA in it. There is a smarter way | ||
# to do this but will come back to that. | ||
data_in <- data_in %>% | ||
filter(Date == as.Date("2019-10-31")) %>% | ||
filter(!grepl("NA", path)) | ||
|
||
sites <- sites_sf %>% pull(site_no) %>% unique | ||
for(s in sites) { | ||
site_coords_svg <- sites_sf %>% | ||
filter(site_no == s) %>% | ||
convert_coords_to_svg(svg_width = svg_width, view_bbox = st_bbox(generate_usa_map_data())) | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. So you are no longer using the SVG with the sites already included? You are adding via D3? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Yes I left some notes about that here #18 (comment) I think it's worth returning to this to draw the initial map from the pipeline, and then grab those paths with D3 for the animation. I was hitting some blocks with how it was set up though due to missing sites when there wasn't data on the first day, and the way I was modifying them with D3 (was creating duplicate elements). This PR addresses those issues but is slower to load. |
||
|
||
gw_data_s <- data_in %>% filter(site_no == s) | ||
|
||
# Spark lines centered at GW location | ||
svg_root %>% | ||
add_grp(grp_nm = s, trans_x = site_coords_svg$x, | ||
trans_y = site_coords_svg$y) %>% | ||
xml_add_child("path", | ||
class = sprintf('gwl_%s', s), | ||
style = sprintf("stroke: none; fill: %s; fill-opacity: 50%%", gw_data_s$color), | ||
d = gw_data_s$path) | ||
|
||
} | ||
|
||
xml2::write_xml(svg_root, file = out_file) | ||
} |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,7 +1,7 @@ | ||
color,peak_mid,quant,path_quant | ||
#7E1900,5,Verylow,M-10 0 C -10 0 0 45 10 0 Z | ||
#C1A53A,17.5,Low,M-10 0 C -10 0 0 32 10 0 Z | ||
#8fce83,50,Normal,M-10 0 C -10 0 0 15 10 0 Z | ||
#8fce83,50,Normal,M-10 0 C -10 0 0 -15 10 0 Z | ||
#479BC5,82.5,High,M-10 0 C -10 0 0 -32 10 0 Z | ||
#1A3399,95,Veryhigh,M-10 0 C -10 0 0 -45 10 0 Z | ||
peak_mid,quant,path_quant | ||
5,Verylow,M-10 0 C -10 0 0 45 10 0 Z | ||
17.5,Low,M-10 0 C -10 0 0 32 10 0 Z | ||
50,Normal,M-10 0 C -10 0 0 15 10 0 Z | ||
50,Normal,M-10 0 C -10 0 0 -15 10 0 Z | ||
82.5,High,M-10 0 C -10 0 0 -32 10 0 Z | ||
95,Veryhigh,M-10 0 C -10 0 0 -45 10 0 Z |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
is this necessary? The
site_no
column should already be character. If not, we should fix here where it is loaded rather than deal with it downstream.Could change this to: