-
Notifications
You must be signed in to change notification settings - Fork 1
/
baseline.py
36 lines (33 loc) · 910 Bytes
/
baseline.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
# -*- coding: utf-8 -*-
'@author: Zhengkun Yao'
import pandas as pd
import numpy as np
def getbaseline(data, data1):
#data = pd.read_csv('data_files/y_train.csv')
#data1=pd.read_csv('data_files/X_train.csv')
#a = data[['Sales']]
#m = data1[['Sales']]
a = data[:,3]
m = data1[:,3]
stu1 = np.array(a)
#print(stu1)
b=len(a)
sum=0
#print('lenth:',b)
for i in stu1:
sum=sum+i
#print('total:',sum)
average=sum/b
#print('average:',average)
c=len(m)
list=[]
for i in range(c):
list.append(average)
array1=np.array(list)
#print(array1)
return array1
if __name__ == "__main__":
'''
This will not be run when imported to another library only if run from this one itself.
'''
a=getbaseline(pd.read_csv('data_files/y_train.csv'), pd.read_csv('data_files/X_train.csv'))