# Source: modules/VectorSpace/word2vec/tokenToken.py (revision 50a3f7)
import pandas as pd
import scipy as sp
import math
import numpy as np
# --- Module-level setup: load the input table and allocate work buffers ---

# Input table. The path is machine-specific and is read at import time.
df = pd.read_csv("/home/skjena/data/testData/fold_1.csv")
numOfRows, numOfCols = df.shape

# View of df without the 'CANCERS' column. Index.difference() attempts to
# sort the remaining labels, so df2's column order may differ from the CSV's.
df2 = df[df.columns.difference(['CANCERS'])]

# a: 2-D scratch matrix that populateTwo() overwrites in place on each call.
a = np.zeros((numOfRows, numOfRows))

# b: stack of numOfRows matrices, one per k, filled by main().
# NOTE: this allocation grows as numOfRows ** 3 float64 values.
b = np.zeros((numOfRows, numOfRows, numOfRows))
def getColumn(i):
    """Return every row of the column at position ``i`` of module-level ``df2``.

    The lookup is positional (``iloc``): ``i`` counts columns in df2's own
    order and is not a column label.
    """
    # df2 is only read here, so no ``global`` declaration is required.
    every_row = slice(None)
    return df2.iloc[every_row, i]
def populateTwo(k):
    """Fill the module-level matrix ``a`` from column ``k`` of ``df2``.

    After the call, ``a[i][j]`` holds the i-th value of column ``k`` for
    every ``i != j`` and ``0`` on the diagonal.  ``a`` is overwritten in
    place (never rebound), so other references to it see the new contents.

    Args:
        k: Integer column position in df2, as accepted by getColumn().
    """
    if numOfRows < 2:
        # Only diagonal cells exist, and those are always zero; the column
        # is not consulted at all in this case.
        a[...] = 0
        return

    # Fetch the column once rather than once per off-diagonal cell.
    column = getColumn(k)

    # df comes from read_csv with its default 0..n-1 index, so positional
    # values line up with the integer row numbers i.
    # Broadcasting copies value i across the whole of row i.
    a[:] = column.to_numpy()[:, np.newaxis]
    np.fill_diagonal(a, 0)
def main():
    """Build the 3-D array ``b`` slice by slice and print slice 2.

    For each ``k`` in ``range(numOfRows)``, populateTwo(k) refills the
    shared matrix ``a`` and its values are copied into ``b[k]``.

    NOTE(review): ``k`` is bounded by the row count but populateTwo uses it
    as a column position in df2.  If df2 has fewer columns than rows the
    positional lookup will fail -- confirm the input is expected to have at
    least as many feature columns as rows.
    """
    for k in range(numOfRows):
        populateTwo(k)
        # Assigning into b[k] copies a's current values, so reusing ``a`` on
        # the next iteration does not disturb slices already stored.
        b[k] = a

    # Slice 2 only exists when there are at least three rows; guard the
    # debug print so smaller inputs do not end in an IndexError.
    if numOfRows > 2:
        print(b[2])


if __name__ == '__main__':
    main()