This repository has been archived by the owner on May 6, 2021. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 16
/
Copy pathdatamodel.py
99 lines (84 loc) · 4.94 KB
/
datamodel.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
from settings import target_metric_name, target_knob_set
from controller import metric_set, knob_set
import numpy as np
import time
class GPDataSet:
    """Container for the samples fed to the GP model.

    Two groups of data are kept:

    * ``previous_*`` -- every sample merged so far.  ``previous_knob_set`` is
      a ``[num samples x num knobs]`` array and ``previous_metric_set`` a
      ``[num samples x num metrics]`` array; entry ``[i][j]`` is the value of
      knob/metric ``j`` in sample ``i``.
    * ``new_*`` -- the single most recent sample, staged by ``add_new_data``
      until ``merge_new_data`` appends it to the ``previous_*`` arrays.

    All workloads are assumed to be of the same type (no workload mapping),
    and all selected knobs are assumed to be important (no clustering).

    Every attribute is ``None`` until ``initdataset`` has been called.
    """

    def __init__(self):
        """Create an empty, uninitialised dataset (see ``initdataset``)."""
        # History of merged samples.
        self.previous_timestamp = None   # list of finish-time strings
        self.previous_rowlabels = None   # [1 ... num of samples]
        self.previous_knob_set = None    # [num of samples x num of knobs]
        self.previous_metric_set = None  # [num of samples x num of metrics]

        # Description of the tuning target.
        self.knob_labels = None          # names of the target knobs
        self.target_metric = None        # name of the target metric
        self.target_lessisbetter = None  # whether a smaller target metric is better
        self.metric_labels = None        # names of all related metrics

        # Most recent, not yet merged, sample.
        self.new_timestamp = None
        self.new_rowlabels = None        # [1]
        self.new_knob_set = None         # [num of knobs]
        self.new_metric_set = None       # [num of metrics]

        # Sizes.
        self.num_knobs = None
        self.num_metrics = None
        self.num_previousamples = None

    def add_new_data(self, new_knob_list, new_metric_list):
        """Stage one new sample and stamp it with the current local time.

        Args:
            new_knob_list: knob values of the sample.
            new_metric_list: metric values of the sample.
        """
        self.new_timestamp = time.strftime("%Y-%m-%d %H:%M:%S", time.localtime())
        self.new_knob_set = new_knob_list
        self.new_metric_set = new_metric_list

    def merge_new_data(self):
        """Append the staged sample to the history as a new last row."""
        self.previous_metric_set = np.vstack(
            (self.previous_metric_set, self.new_metric_set)
        )
        self.previous_knob_set = np.vstack(
            (self.previous_knob_set, self.new_knob_set)
        )
        self.num_previousamples += 1
        # Row labels are simply 1..N, rebuilt after every merge.
        self.previous_rowlabels = np.array(
            list(range(1, self.num_previousamples + 1))
        )
        self.previous_timestamp.append(self.new_timestamp)

    def initdataset(self, metric_list):
        """Reset the dataset to an empty history for the configured target.

        The knob names come from the module-level ``target_knob_set`` and the
        target metric from ``target_metric_name`` / ``metric_set``.

        Args:
            metric_list: names of all metrics recorded per sample.
        """
        self.num_knobs = len(target_knob_set)
        self.num_metrics = len(metric_list)
        self.num_previousamples = 0

        self.knob_labels = np.array(list(target_knob_set))
        self.metric_labels = np.array(list(metric_list))

        # Empty history: zero rows, one column per knob / metric.
        self.previous_rowlabels = np.array(
            list(range(1, self.num_previousamples + 1))
        )
        self.previous_timestamp = [" "] * self.num_previousamples
        self.previous_knob_set = np.zeros([self.num_previousamples, self.num_knobs])
        self.previous_metric_set = np.zeros([self.num_previousamples, self.num_metrics])

        # Placeholder for the staged sample.
        self.new_rowlabels = [1]
        self.new_timestamp = " "
        self.new_knob_set = np.zeros([1, self.num_knobs])
        self.new_metric_set = np.zeros([1, self.num_metrics])

        self.target_metric = target_metric_name
        self.target_lessisbetter = metric_set[target_metric_name]['lessisbetter']

    def printdata(self):
        """Print the history, the staged sample and the target description."""
        print("################## data ##################")
        print("------------------------------previous:------------------------------")
        print("rowlabels, finish_time, knobs, metrics")
        for i in range(self.num_previousamples):
            print(
                self.previous_rowlabels[i], ',',
                self.previous_timestamp[i], ',',
                self.previous_knob_set[i], ',',
                self.previous_metric_set[i],
            )
        print("------------------------------new:------------------------------")
        print("knobs:     ", self.new_knob_set)
        print("metrics:   ", self.new_metric_set)
        print("rowlabels: ", self.new_rowlabels)
        print("timestamp: ", self.new_timestamp)
        print("------------------------------TARGET:------------------------------")
        print("knob: ", self.knob_labels)
        print("metric: ", self.target_metric)
        print("metric_lessisbetter: ", self.target_lessisbetter)
        print("------------------------------------------------------------")
        print("num of knobs == ", self.num_knobs)
        print("knobs:  ", self.knob_labels)
        print("num of metrics == ", self.num_metrics)
        print("metrics:  ", self.metric_labels)
        print("------------------------------------------------------------")
        print("################## data ##################")

    def dat2xls(self):
        """Print the history as comma-separated rows (knobs, then metrics).

        One line is printed per merged sample; every value is followed by
        ``", "`` so the output can be pasted into a spreadsheet.
        """
        print("################## data ##################")
        for i in range(self.num_previousamples):
            # A knob row holds one value per knob, so each value is printed
            # individually; calling float() on the whole row only works when
            # there is exactly one knob.  np.ravel also accepts a scalar row.
            for knob_value in np.ravel(self.previous_knob_set[i]):
                print(float(knob_value), end=', ')
            for metric_value in self.previous_metric_set[i]:
                print(float(metric_value), end=', ')
            print("")
        print("################## data ##################")