-
Notifications
You must be signed in to change notification settings - Fork 0
/
Coal Plant.R
122 lines (63 loc) · 2.06 KB
/
Coal Plant.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
# Load the machine-utilization CSV picked interactively by the user.
machine <- read.csv(file.choose())

# The script relies on these columns; fail early with a clear message if the
# selected file does not provide them.
required_cols <- c("Timestamp", "Machine", "Percent.Idle")
missing_cols <- setdiff(required_cols, names(machine))
if (length(missing_cols) > 0) {
  stop(
    "Input file is missing column(s): ",
    paste(missing_cols, collapse = ", "),
    call. = FALSE
  )
}

# Quick look at what was loaded.
head(machine)
str(machine)
summary(machine)

# Derive the utilization column as 1 - Percent.Idle
# (assumes Percent.Idle is a 0-1 fraction -- TODO confirm against the data).
machine$utilization <- 1 - machine$Percent.Idle

# Handling date-times in R: parse the text timestamps, written as
# day/month/year hour:minute, into POSIXct and store them in a new column.
machine$PosixTime <- as.POSIXct(machine$Timestamp, format = "%d/%m/%Y %H:%M")
head(machine)

# Rearrange the columns: drop the raw text timestamp and move PosixTime to the
# front. Selecting by name keeps every remaining column in its current order,
# however many columns the CSV contains.
machine$Timestamp <- NULL
machine <- machine[, c("PosixTime", setdiff(names(machine), "PosixTime"))]
# Lists are useful for collecting results about one subset of the data.
# Subset the rows for machine "RL1". `%in%` never returns NA, so rows whose
# Machine value is missing are left out instead of coming back as all-NA rows
# (which is what `==` inside `[` produces).
RL1 <- machine[machine$Machine %in% "RL1", ]
summary(RL1)
# Rebuild the factor so only the level(s) present in the subset remain.
RL1$Machine <- factor(RL1$Machine)

# Values for the list: minimum, mean and maximum utilization of RL1,
# in that order, ignoring missing values.
machine_stats_rl1 <- c(
  min(RL1$utilization, na.rm = TRUE),
  mean(RL1$utilization, na.rm = TRUE),
  max(RL1$utilization, na.rm = TRUE)
)
machine_stats_rl1
# Count the RL1 observations whose utilization is below 90 %.
# Observations with missing utilization are not counted.
machine_under_90_flag <- sum(RL1$utilization < 0.90, na.rm = TRUE)
machine_under_90_flag

# Bundle the machine label, its summary statistics and the below-90 % count
# into a single list.
list_rl1 <- list("RL1", machine_stats_rl1, machine_under_90_flag)
list_rl1

# Name the components of the list.
names(list_rl1) # no names have been assigned yet
names(list_rl1) <- c("machinetype", "stats", "lowthreshold")
list_rl1
list_rl1[["machinetype"]]
# Vector: every timestamp at which RL1's utilization is unknown (NA).
list_rl1$unknownhrs <- RL1[is.na(RL1$utilization), "PosixTime"]
list_rl1$unknownhrs

# Removing a component: assigning NULL deletes it and renumbers the components
# after it, e.g. `list_rl1[4] <- NULL` would drop `unknownhrs`. It is not
# executed here because the subsetting examples further down in this section
# read `unknownhrs` as component 4. Assigning NULL to an index beyond the end
# of the list removes nothing, so such calls are omitted as well.

# Attach the RL1 data frame itself as a further component.
list_rl1$data <- RL1
list_rl1
summary(list_rl1)

# Subsetting the list.
list_rl1[[4]][1]        # `[[` extracts component 4, then its first element
list_rl1$unknownhrs[1]  # the same value, addressed by name
list_rl1[1:3]           # `[` returns a sub-list of components 1 to 3
list_rl1[c(1, 4)]       # sub-list of components 1 and 4
# Sub-list selected by component name; the names must match those set on
# list_rl1 ("machinetype", "stats", "lowthreshold", ...).
sublist_rl1 <- list_rl1[c("machinetype", "stats")]
sublist_rl1
sublist_rl1[[2]][1]     # first element of the `stats` component
# Building the time-series plot.
# ggplot(), geom_line(), aes(), facet_grid() and geom_hline() come from
# ggplot2, so the package has to be attached before they are called.
library(ggplot2)

# Base plot object bound to the full machine data set.
p <- ggplot(data = machine)

# One utilization line per machine, each machine in its own facet row, with a
# dotted gray reference line at the 90 % threshold. Built once and reused.
# NOTE(review): recent ggplot2 releases prefer `linewidth` over `size` for
# line geoms -- confirm the installed version before switching.
machineplot <- p +
  geom_line(
    aes(x = PosixTime, y = utilization, colour = Machine),
    size = 1.2
  ) +
  facet_grid(Machine ~ .) +
  geom_hline(yintercept = 0.90, colour = "Gray", size = 1.2, linetype = 3)
machineplot

# Store the plot alongside the other RL1 components.
list_rl1$plot <- machineplot
list_rl1