-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathstats.py
75 lines (57 loc) · 1.7 KB
/
stats.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
import pandas as pd
from scipy import stats
data = '''Region,Alcohol,Tobacco
North, 6.47, 4.03
Yorkshire, 6.13, 3.76
Northeast, 6.19, 3.77
East Midlands, 4.89, 3.34
West Midlands, 5.63, 3.47
East Anglia, 4.52, 2.92
Southeast, 5.89, 3.20
Southwest, 4.79, 2.71
Wales, 5.27, 3.53
Scotland, 6.08, 4.51
Northern Ireland, 4.02, 4.56'''
data = data.splitlines()
data = [i.split(',') for i in data]
column_names = data[0]
data_rows = data[1::]
df = pd.DataFrame(data_rows, columns=column_names)
df['Alcohol'] = df['Alcohol'].astype(float)
df['Tobacco'] = df['Tobacco'].astype(float)
print "The mean for the Alcohol dataset is: "
print df['Alcohol'].mean()
print "\n"
print "The median for the Alcohol dataset is: "
print df['Alcohol'].median()
print "\n"
print "The mode for the Alcohol dataset is: "
print ' '.join(map(str, stats.mode(df['Alcohol'])[0]))
print "\n"
print "The range for the Alcohol dataset is: "
print max(df['Alcohol']) - min(df['Alcohol'])
print "\n"
print "The variance for the Alcohol dataset is: "
print df['Alcohol'].var()
print "\n"
print "The standard deviation for the Alcohol dataset is: "
print df['Alcohol'].std()
print "\n"
print "The mean for the Tobacco dataset is: "
print df['Tobacco'].mean()
print "\n"
print "The median for the Tobacco dataset is: "
print df['Tobacco'].median()
print "\n"
print "The mode for the Tobacco dataset is: "
print ' '.join(map(str, stats.mode(df['Tobacco'])[0]))
print "\n"
print "The range for the Tobacco dataset is: "
print max(df['Tobacco']) - min(df['Tobacco'])
print "\n"
print "The variance for the Tobacco dataset is: "
print df['Tobacco'].var()
print "\n"
print "The standard deviation for the Tobacco dataset is: "
print df['Tobacco'].std()
print "\n"