diff options
Diffstat (limited to 'src/histogram.py')
| -rwxr-xr-x | src/histogram.py | 28 |
1 files changed, 28 insertions, 0 deletions
#!/usr/bin/env python3
"""Plot, for each house, a histogram of its min-max normalised course scores.

Usage: histogram.py dataset_path
"""

import sys

import matplotlib.pyplot as plt

from dataset import Dataset

# Order matters: houses are assigned to the 2x2 subplot grid row by row.
HOUSES = ("Gryffindor", "Slytherin", "Ravenclaw", "Hufflepuff")


def house_hist(ax, d, house_name):
    """Draw the score histogram of one house on the given axes.

    Args:
        ax: Object exposing ``hist`` and ``set_title`` (here, one of the
            axes returned by ``plt.subplots``).
        d: Object whose ``df`` attribute is a DataFrame with a ``"house"``
            column and score columns spanning ``"arithmancy"`` through
            ``"flying"``.
        house_name: Value of the ``"house"`` column selecting the rows.
    """
    house_rows = d.df[d.df["house"] == house_name]
    # Label-based slice: both end columns are included.
    scores = house_rows.loc[:, "arithmancy":"flying"]
    # Min-max scale every column using the min/max of this house's rows only,
    # so that all courses can share a single histogram.
    # NOTE(review): a column that is constant within the house yields 0/0
    # here — confirm how the resulting values should be handled.
    col_min = scores.min()
    col_max = scores.max()
    normalised = (scores - col_min) / (col_max - col_min)
    ax.hist(normalised.values.flatten(), bins=40, rwidth=0.8)
    ax.set_title(house_name)


def main():
    """Load the dataset named on the command line and show the 2x2 figure."""
    if len(sys.argv) != 2:
        # Raising a plain string is a TypeError in Python 3; sys.exit prints
        # the message to stderr and terminates with a non-zero status.
        sys.exit("Usage: {} dataset_path".format(sys.argv[0]))
    d = Dataset(sys.argv[1])

    fig, axs = plt.subplots(2, 2, sharey=True, tight_layout=True)
    # axs.flat walks the grid in row-major order: [0][0], [0][1], [1][0], [1][1].
    for ax, house_name in zip(axs.flat, HOUSES):
        house_hist(ax, d, house_name)
    plt.show()


if __name__ == "__main__":
    main()
