Diff of /plot.py [000000] .. [48f029]

Switch to side-by-side view

--- a
+++ b/plot.py
@@ -0,0 +1,38 @@
+import preprocessing
+import matplotlib.pyplot as plt
+import seaborn as sns
+sns.set(style="ticks", color_codes=True)
+sns.set_style("whitegrid")
+sns.set_context("poster")
+
+
+def show_data():
+    """
+    Plots features pairwise, of the following set:
+    - average allelic fraction
+    - hematocrit
+    - platelet
+    - white blood cell count
+    - hemoglobin
+    - age
+    """
+
+    # Preprocessing
+    aml_data = preprocessing.load_csv()
+    preprocessing.fill_missing_values(aml_data)
+    preprocessing.add_total_genes(aml_data)
+
+    # Delete gene columns
+    for column in aml_data.columns:
+        if 'Gene.' in column:
+            del aml_data[column]
+
+    # Plot pairwise
+    sns.set(style='whitegrid')
+    cols = ['caseflag', 'Total.Genes', 'Age', 'WBC', 'PLATELET', 'HEMOGLBN', 'HEMATOCR']
+    sns.pairplot(aml_data[cols],
+                 hue='caseflag',  # different caseflags have different colors
+                 markers=['.', r'$+$'],  # markers
+                 plot_kws={"s": 250},  # marker size (100 default)
+                 size=5.0)  # size of each subplot
+    plt.show()