--- a
+++ b/test/mayosrs/read_data.py
@@ -0,0 +1,107 @@
+import os
+import sys
+from collections import defaultdict
+import glob
+import datetime
+import re
+import random
+
+
+thisdir = os.path.dirname(os.path.abspath(__file__))
+datadir = os.path.join(thisdir, 'data')
+
+
+def main():
+    srs = get_srs()
+    print(srs)
+
+
+def get_srs():
+    srs = _get_srs()
+    srs_mini = _get_srs_mini()
+    full = {}
+    full.update(srs)
+    full.update(srs_mini)
+    return full
+
+
+def get_srs_cui():
+    srs = _get_srs_cui()
+    srs_mini = _get_srs_mini_cui()
+    full = {}
+    full.update(srs)
+    full.update(srs_mini)
+    return full
+
+
+def _get_srs():
+    X, Y = [], []
+    filename = os.path.join(datadir, 'MayoSRS.csv')
+    with open(filename, 'r') as f:
+        lines = f.readlines()
+        for line in lines[1:]:
+            toks = line.strip().split(',')
+            score = float(toks[0])
+            phrase1 = toks[3].strip('"').lower()
+            phrase2 = toks[4].strip('"').lower()
+            X.append((phrase1, phrase2))
+            Y.append(score)
+    scores = {'srs': (X, Y)}
+    return scores
+
+
+def _get_srs_cui():
+    X, Y = [], []
+    filename = os.path.join(datadir, 'MayoSRS.csv')
+    with open(filename, 'r') as f:
+        lines = f.readlines()
+        for line in lines[1:]:
+            toks = line.strip().split(',')
+            score = float(toks[0])
+            cui1 = toks[1].strip('"')
+            cui2 = toks[2].strip('"')
+            X.append((cui1, cui2))
+            Y.append(score)
+    scores = {'srs': (X, Y)}
+    return scores
+
+
+def _get_srs_mini():
+    X, physician_Y, coder_Y = [], [], []
+    filename = os.path.join(datadir, 'MiniMayoSRS.csv')
+    with open(filename, 'r') as f:
+        lines = f.readlines()
+        for line in lines[1:]:
+            toks = line.strip().split(',')
+            physician_score = float(toks[0])
+            coder_score = float(toks[1])
+            phrase1 = toks[4].strip('"').lower()
+            phrase2 = toks[5].strip('"').lower()
+            X.append((phrase1, phrase2))
+            physician_Y.append(physician_score)
+            coder_Y.append(coder_score)
+    scores = {'mini_physician': (X, physician_Y), 'mini_coder': (X, coder_Y)}
+    return scores
+
+
+def _get_srs_mini_cui():
+    X, physician_Y, coder_Y = [], [], []
+    filename = os.path.join(datadir, 'MiniMayoSRS.csv')
+    with open(filename, 'r') as f:
+        lines = f.readlines()
+        for line in lines[1:]:
+            toks = line.strip().split(',')
+            physician_score = float(toks[0])
+            coder_score = float(toks[1])
+            cui1 = toks[2].strip('"')
+            cui2 = toks[3].strip('"')
+            X.append((cui1, cui2))
+            physician_Y.append(physician_score)
+            coder_Y.append(coder_score)
+    scores = {'mini_physician': (X, physician_Y), 'mini_coder': (X, coder_Y)}
+    return scores
+
+
+if __name__ == '__main__':
+    main()
+    print(get_srs_cui())