-
Notifications
You must be signed in to change notification settings - Fork 19
/
Copy pathresearchModelK.R
119 lines (106 loc) · 4.05 KB
/
researchModelK.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
# Title, : Research for model K using Random Forest trees.
# Objective : Evaluate how well fits the RF model to multiples symbols.
# Created by: pablocc
# Created on: 08/09/2020
# CONCLUSION: Generalized daily aspects / planets activation don't provide a significant relationship
# that can help to predict price difference, seems that aspect effect cannot be separated from
# the planets that originated the aspect relationship. The next investigation is to verify
# if keeping one aspect feature per fast planet could provide relevant significance and generalization.
library(caret)
library(magrittr)
library(parallel)
library(psych)
library(plyr)
library(randomForest)
library(rattle)
library(tidyverse)
source("./indicatorPlots.r")
dailyAspects <- prepareHourlyAspectsModelK()
symbol <- "LINK-USD"
securityData <- mainOpenSecurity(
symbol, 14, 28, "%Y-%m-%d",
"2010-01-01", "2020-08-15"
)
# Experiment with Random Forest model.
aspectViewRaw <- dailyAspects
#aspectViewRaw <- dailyAspects[p.x != "MO"]
aspectsT <- paste("a", aspects, sep = "")
aspectsX <- paste("a", aspects, ".x", sep = "")
aspectsY <- paste("a", aspects, ".y", sep = "")
aspectsG <- paste("a", aspects, ".g", sep = "")
#selectCols <- c("result", "acx", aspectsX, "spp", "dcp", "zx", "zy", "MO", "ME", "VE", "SU", "MA", "JU", "SA")
#selectCols <- c("result", aspectsX, "ME.x", "VE.x", "MA.x", "JU.x", "SA.x", "NN.x")
aspectsCols <- c(
aspectsX, aspectsY,
"agt", "wd",
"VE.x", "SU.x", "MA.x", "JU.x", "NN.x",
"PL", "MO",
"ME.y", "VE.y", "SU.y", "MA.y", "JU.y", "NN.y", "UR.y",
"sp.x", "sp.y",
"dc.x", "dc.y"
)
selectCols <- c("Date", aspectsCols)
aspectView <- aspectViewRaw[, ..selectCols]
aspectView <- aspectView[, lapply(.SD, function(x) max(x)), .SDcols = aspectsCols, by="Date"]
aspectView <- merge(securityData[, c('Date', 'diffPercent')], aspectView, by = "Date")
varCorrelations <- aspectView[, -c('Date')] %>%
cor() %>%
round(digits = 2)
finalCorrelations <- sort(varCorrelations[, 1])
print(finalCorrelations)
# Select significant columns with relevant correlation.
significantCols <- names(finalCorrelations[abs(finalCorrelations) > 0.03])
print(significantCols)
aspectView[, result := cut(diffPercent, c(-100, 0, 100), c("sell", "buy"))]
selectColsFiltered <- c("result", significantCols[significantCols != "diffPercent"])
aspectViewFiltered <- aspectView[, ..selectColsFiltered]
trainIndex <- createDataPartition(aspectViewFiltered$result, p = 0.70, list = FALSE)
aspectViewTrain <- aspectViewFiltered[trainIndex,]
aspectViewTest <- aspectViewFiltered[-trainIndex,]
#linearModel <- lm(diffPercent ~ JU.y + sp.x, data = aspectViewTrain)
#summary(linearModel)
control <- trainControl(
method = "repeatedcv",
number = 10,
repeats = 1,
search = "random",
allowParallel = T
)
tree1 = train(
formula(result ~ .),
data = aspectViewTrain,
method = "rf",
metric = "Accuracy",
tuneLength = 10,
ntree = 100,
trControl = control,
importance = F
)
#summary(tree1)
# effect_p <- tree1 %>% predict(newdata = aspectViewTrain)
# Prediction results on train.
#table(
# actualclass = aspectViewTrain$result,
# predictedclass = effect_p
#) %>%
# confusionMatrix() %>%
# print()
effect_p <- tree1 %>% predict(newdata = aspectViewTest)
# Prediction results on test.
table(
actualclass = aspectViewTest$result,
predictedclass = effect_p
) %>%
confusionMatrix() %>%
print()
#saveRDS(tree1, "./models/LINK_MO_general_rf4.rds")
selectCols2 <- selectCols[selectCols != "result"]
futureAspects <- dailyAspects[Date >= as.Date("2020-08-20") & p.x == "MO",]
futureAspectsFeatures <- futureAspects[, ..selectCols2]
futureAspectsFeatures <- futureAspects[, lapply(.SD, sum), by = Date, .SDcols = aspectsCols]
effect_p <- tree1 %>% predict(newdata = futureAspectsFeatures)
#futureAspects$effect_p <- mapvalues(effect_p, from = c("sell", "buy"), to = c(0, 1))
futureAspectsFeatures$effect_p <- effect_p
marketPrediction <- futureAspectsFeatures[, c('Date', "effect_p")]
setnames(marketPrediction, c('Date', 'Action'))
fwrite(marketPrediction[Date <= Sys.Date() + 60], paste("./predictions/ml", symbol, "daily.csv", sep = "-"))