-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathSimplePrediction.R
51 lines (39 loc) · 1.46 KB
/
SimplePrediction.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
library(rpart)
library(rpart.plot)
library(DMwR)
#Loading Training Data
#Dataset citibike.train
pre1 = read.csv(file = file.choose(), header = T, sep = ",",
stringsAsFactors = F)
#Dataset 100A W/ Ans
pre2 = read.csv(file = file.choose(), header = T, sep = ",",
stringsAsFactors = F)
#Merged
train = merge(pre1,pre2,all.x=T)
plot(train$birth.year,train$tripduration)
summary(train$tripduration)
summary(train$birth.year)
model1 = rpart(tripduration~birth.year, data=train, minsplit=1, minbucket=1, cp=0.001)
model1
rpart.plot(model1)
#10000A Data Load
dA = read.csv(file = file.choose(), header = T, sep = ",",
stringsAsFactors = F)
dAW = read.csv(file = file.choose(), header = T, sep = ",",
stringsAsFactors = F)
#10000A Prediction and Errors
pred1 = predict(model1, dA)
pred1
DMwR::regr.eval(pred1,dAW$tripduration)
out = data.frame(Predictions = pred2)
write.csv(out, row.names = FALSE, file="C:/Users/bshah/OneDrive/Documents/RWorkspace/PredA.csv")
#10000B Predictions
train2 = merge(train, dAW,all.x=T)
model2 = rpart(tripduration~birth.year, data=train2, minsplit=1, minbucket=1, cp=0.001)
#10000B Data Load
dB = read.csv(file = file.choose(), header = T, sep = ",",
stringsAsFactors = F)
#10000B Prediction and Errors
pred2 = predict(model2, dB)
output = data.frame(Predictions = pred2)
write.csv(output, row.names = FALSE, file="C:/Users/bshah/OneDrive/Documents/RWorkspace/PredB.csv")