forked from ankane/trend-api
-
Notifications
You must be signed in to change notification settings - Fork 0
/
helpers.R
80 lines (64 loc) · 1.7 KB
/
helpers.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
prepareSeries <- function(series, frequency, name="series"){
if (is.null(series)) {
stop(paste("[400] Missing parameter:", name))
}
# remove null values
series[sapply(series, is.null)] <- NULL
if (length(series) < 10) {
stop(paste("[400] Invalid parameter:", name, "must have at least 10 data points"))
}
tryCatch({
ds <- names(series)
y <- as.numeric(series)
if (any(nchar(ds) > 10)) {
ds <- anytime(ds)
} else {
ds <- anydate(ds)
}
}, error=function(err) {
stop(paste("[400] Missing parameter:", name))
})
if(any(duplicated(ds)) || any(sapply(ds, is.na))) {
stop(paste("[400] Missing parameter:", name))
}
data <- data.frame(ds=ds, y=y)
data <- data[order(data$ds),]
interval <- get_interval(data$ds)
if (is.null(frequency)) {
if (interval == "day") {
frequency <- 7
} else if (interval == "month") {
frequency <- 12
} else {
frequency <- detectFrequency(data$y)
}
}
data <- data %>% pad(interval=interval)
if (nrow(data) > 1000) {
stop(paste("[400] Invalid parameter: computed", name, "can have a max of 1000 data points"))
}
missing_p <- sum(is.na(data$y)) / nrow(data)
if (missing_p > 0.2) {
stop(paste("[400] Invalid parameter:", name, "missing too much data"))
}
ts <- ts(data$y, frequency=frequency)
bad <- FALSE
tryCatch({
ts <- na.interp(ts)
}, warning=function(w) {
bad <<- TRUE
})
list(ts=ts, ds=data$ds, bad=bad, interval=interval, frequency=frequency)
}
detectFrequency <- function(y) {
if (is.constant(y)) {
1
} else {
findfrequency(y)
}
}
formatTime <- function(ds) {
r <- rfc3339(ds)
stri_sub(r[nchar(r) == 24], -2, -3) <- ":"
r
}