1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
|
#!/bin/python3
import sys
import matplotlib.pyplot as plt
from dataset import Dataset
def house_hist(ax, d, house_name):
    """Draw a histogram of one house's min-max scaled scores on ``ax``.

    Rows of ``d.df`` whose ``"house"`` column equals ``house_name`` are
    selected, and the columns from ``"arithmancy"`` through ``"flying"``
    (label slice, both ends included) are kept. Each column is rescaled with
    the minimum and maximum observed within that house, then all values are
    pooled into a single flat array and plotted with 40 bins.

    Args:
        ax: Object exposing ``hist`` and ``set_title`` (presumably a
            matplotlib Axes -- confirm against the caller).
        d: Object whose ``df`` attribute is indexed like a pandas DataFrame
            with a ``"house"`` column.
        house_name: Value matched against the ``"house"`` column; also used
            as the subplot title.
    """
    in_house = d.df["house"] == house_name
    courses = d.df[in_house].loc[:, "arithmancy":"flying"]

    # Per-column min-max scaling, computed over this house's rows only.
    lowest = courses.min()
    spread = courses.max() - lowest
    normalized = (courses - lowest) / spread

    ax.hist(normalized.to_numpy().flatten(), bins=40, rwidth=0.8)
    ax.set_title(house_name)
if __name__ == "__main__":
    # Exactly one command-line argument is expected: the dataset path.
    if len(sys.argv) != 2:
        # Raising a plain string is a TypeError in Python 3 (exceptions must
        # derive from BaseException), which would hide the usage text.
        # sys.exit with a string prints it to stderr and exits with status 1.
        sys.exit("Usage: {} dataset_path".format(sys.argv[0]))

    d = Dataset(sys.argv[1])

    # 2x2 grid with one panel per house; the y axis is shared across panels.
    fig, axs = plt.subplots(2, 2, sharey=True, tight_layout=True)
    house_hist(axs[0][0], d, "Gryffindor")
    house_hist(axs[0][1], d, "Slytherin")
    house_hist(axs[1][0], d, "Ravenclaw")
    house_hist(axs[1][1], d, "Hufflepuff")
    plt.show()
|