Diff of /datasets.py [000000] .. [0037e2]

Switch to unified view

a b/datasets.py
1
# -*- coding: utf-8 -*-
2
"""Untitled39.ipynb

Automatically generated by Colab.

Original file is located at
    https://colab.research.google.com/drive/1pcHOb70S4TwkxIKgrNTFfLdc71vMgOKg
"""
9
10
import torch
11
import time
12
import evaluate
13
import pandas as pd
14
import numpy as np
15
from transformers import DataCollatorForSeq2Seq
16
17
18
from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
19
from transformers import Seq2SeqTrainingArguments, DataCollatorForSeq2Seq, Seq2SeqTrainer
20
#from datasets import load_dataset
21
22
from google.colab import drive
import os

# Mount Google Drive into the Colab filesystem so the CSV files are reachable.
drive.mount('/content/drive')

# Every relative pd.read_csv() path below is resolved against this folder.
folder_path = '/content/drive/My Drive/nosocomial/hapi'
os.chdir(folder_path)
print("Current Directory:", os.getcwd())
29
30
# HAPI tables, read from the current working directory.
# Each CSV is parsed exactly once: the earlier version re-read
# train.labels.csv, test.labels.csv and test.chronologies.csv and simply
# overwrote identical data, doubling the parse time for those files.
hapi_trainLabels = pd.read_csv('train.labels.csv')
hapi_trainChronologies = pd.read_csv('train.chronologies.csv')
hapi_develAdmittimes = pd.read_csv('devel.admittimes.csv')
hapi_develChronologies = pd.read_csv('devel.chronologies.csv')
hapi_develLabels = pd.read_csv('devel.labels.csv')
hapi_negativeLabels = pd.read_csv('negative_labels.csv')
hapi_testAdmittimes = pd.read_csv('test.admittimes.csv')
hapi_testChronologies = pd.read_csv('test.chronologies.csv')
hapi_testLabels = pd.read_csv('test.labels.csv')
# Lower-case spelling kept for backward compatibility. It is an independent
# copy (as it was when read separately), so mutating one does not affect
# the other.
hapi_testchronologies = hapi_testChronologies.copy()
42
43
# HAKI tables, read from the current working directory.
# NOTE(review): the working directory was set to the 'hapi' folder earlier in
# this script and is not changed before these reads, so these frames hold the
# same file contents as the hapi_* frames. Confirm whether a separate HAKI
# folder was intended.
# Each CSV is parsed exactly once: the earlier version re-read
# train.labels.csv, test.labels.csv and test.chronologies.csv redundantly.
haki_trainLabels = pd.read_csv('train.labels.csv')
haki_trainChronologies = pd.read_csv('train.chronologies.csv')
haki_develAdmittimes = pd.read_csv('devel.admittimes.csv')
haki_develChronologies = pd.read_csv('devel.chronologies.csv')
haki_develLabels = pd.read_csv('devel.labels.csv')
haki_negativeLabels = pd.read_csv('negative_labels.csv')
haki_testAdmittimes = pd.read_csv('test.admittimes.csv')
haki_testChronologies = pd.read_csv('test.chronologies.csv')
haki_testLabels = pd.read_csv('test.labels.csv')
# Lower-case spelling kept for backward compatibility. It is an independent
# copy (as it was when read separately), so mutating one does not affect
# the other.
haki_testchronologies = haki_testChronologies.copy()
55
56
# HAA tables, read from the current working directory.
# NOTE(review): the working directory was set to the 'hapi' folder earlier in
# this script and is not changed before these reads, so these frames hold the
# same file contents as the hapi_* frames. Confirm whether a separate HAA
# folder was intended.
# Each CSV is parsed exactly once: the earlier version re-read
# test.labels.csv and test.chronologies.csv redundantly.
haa_trainLabels = pd.read_csv('train.labels.csv')
haa_trainChronologies = pd.read_csv('train.chronologies.csv')
haa_develAdmittimes = pd.read_csv('devel.admittimes.csv')
haa_develChronologies = pd.read_csv('devel.chronologies.csv')
haa_develLabels = pd.read_csv('devel.labels.csv')
haa_negativeLabels = pd.read_csv('negative_labels.csv')
haa_testAdmittimes = pd.read_csv('test.admittimes.csv')
haa_testChronologies = pd.read_csv('test.chronologies.csv')
haa_testLabels = pd.read_csv('test.labels.csv')
# Lower-case spelling kept for backward compatibility. It is an independent
# copy (as it was when read separately), so mutating one does not affect
# the other.
haa_testchronologies = haa_testChronologies.copy()
67
68
69
70
"""####  HAA    C0002871 (Anemia)   anemia, anaemia, HAA    WHO[19]"""
71
72
# Notebook-style previews of the HAA frames. The .head() results are not
# bound or printed, so outside an interactive notebook they are discarded.
# haa_trainChronologies is listed twice because it is previewed twice.
for _preview_frame in (
    haa_trainChronologies,
    haa_trainChronologies,
    haa_develAdmittimes,
    haa_develChronologies,
):
    _preview_frame.head()
79
80
81
82
83