Switch to side-by-side view

--- a
+++ b/development/qa-server/Fnetune_models_compare.ipynb
@@ -0,0 +1 @@
+{"nbformat":4,"nbformat_minor":0,"metadata":{"colab":{"name":"Fnetune_models_compare.ipynb","provenance":[],"collapsed_sections":[]},"kernelspec":{"name":"python3","display_name":"Python 3"},"language_info":{"name":"python"},"accelerator":"GPU"},"cells":[{"cell_type":"code","metadata":{"id":"CcJoBmV-Jh84"},"source":["!pip install transformers[sentencepiece] spacy rouge"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"id":"sAAcKPcjuvw4"},"source":["!nvidia-smi"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"id":"FA_vVNqQJonA"},"source":["!python -m spacy download en_core_web_lg"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"id":"7DDkPtP1JqWr","executionInfo":{"status":"ok","timestamp":1632404455171,"user_tz":-210,"elapsed":7974,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":["import torch\n","import re\n","import spacy\n","import nltk\n","import json\n","import en_core_web_lg\n","import pandas as pd\n","from tqdm import tqdm\n","from rouge import Rouge \n","from nltk.translate.bleu_score import sentence_bleu, SmoothingFunction\n","from transformers import AutoModelForMaskedLM, AutoModel, AutoTokenizer, pipeline"],"execution_count":5,"outputs":[]},{"cell_type":"code","metadata":{"id":"uHlKEnVyJvgd"},"source":["nlp = en_core_web_lg.load()\n","nltk.download('punkt')"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"id":"9XFoBomznoWR"},"source":["from google.colab import drive\n","drive.mount('/content/drive')"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"id":"HJpeVY414JNx"},"source":["cd /content/drive/My 
Drive/"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"id":"LxHglW4z4L-I"},"source":["!ls"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"giOXiAl3Jvz7","executionInfo":{"status":"ok","timestamp":1632404644304,"user_tz":-210,"elapsed":22,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"c74547b6-1c70-4fc2-e39e-fdbb5fa1675c"},"source":["cd /content/drive/My Drive/Dataset/"],"execution_count":15,"outputs":[{"output_type":"stream","name":"stdout","text":["/content/drive/My Drive/Dataset\n"]}]},{"cell_type":"code","metadata":{"id":"2CrMRVKNu8cW"},"source":["!gdown https://drive.google.com/uc?id=1wBD5codLeDD8iEBIe_pnTHqQr4hqLsqi"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"id":"hek-cOHHvFus"},"source":["!gdown https://drive.google.com/uc?id=1mj79A-lAVYIWXtvDKUTslyIjPvyHi2MJ"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"id":"urhqR1nTKw3U","executionInfo":{"status":"ok","timestamp":1632404917708,"user_tz":-210,"elapsed":379,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":["# Load the QA evaluation set; the context manager closes the file handle once the JSON is parsed.\n","with open('/content/drive/MyDrive/Dataset/qa_multi_answer.json', 'r', encoding='utf-8') as f:\n","  qa = json.load(f)"],"execution_count":19,"outputs":[]},{"cell_type":"code","metadata":{"id":"Ssq5_8g5UB4P"},"source":["qa['data'][0]"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"zIuyVTgSvVCX","executionInfo":{"status":"ok","timestamp":1632404920327,"user_tz":-210,"elapsed":13,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"6459bfe5-bd20-42c3-9c3a-39b4591e0aa4"},"source":["cd /content/drive/My 
Drive/base_bert/final_base_bert_QA_checkpoint"],"execution_count":21,"outputs":[{"output_type":"stream","name":"stdout","text":["/content/drive/My Drive/base_bert/final_base_bert_QA_checkpoint\n"]}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"ElNw4nJLvgnL","executionInfo":{"status":"ok","timestamp":1632404921026,"user_tz":-210,"elapsed":351,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"3f9afb06-1bad-42e3-c16c-249a2abe9dc5"},"source":["!ls"],"execution_count":22,"outputs":[{"output_type":"stream","name":"stdout","text":["config.json\t\t pytorch_model.bin\t  training_args.bin\n","nbest_predictions_.json  special_tokens_map.json  vocab.txt\n","predictions_.json\t tokenizer_config.json\n"]}]},{"cell_type":"code","metadata":{"id":"bi-y2iGAvQ6G","executionInfo":{"status":"ok","timestamp":1632411140516,"user_tz":-210,"elapsed":556,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":["n_top = 3\n","rouge = Rouge()\n","smoothie = SmoothingFunction().method4\n","bleu_scores = []\n","rouge1_scores = []\n","rouge2_scores = []\n","rougel_scores = []\n","\n","\n","model_names = {'/content/drive/My Drive/2_squeeze/Final_squeeze-squad':'question_answering',\n","               '/content/drive/My Drive/2_squeeze/Squeeze-bert_MLM/MLM_output_dir/Final_squeeze_MLM':'question_answering',\n","               '/content/drive/My Drive/Squeeze/QA_Squeeze_Squad/squeeze-bert-squad-QA':'question_answering',\n","               '/content/drive/My Drive/base_bert/final_base_bert_QA_checkpoint':'question_answering',\n","               '/content/drive/My Drive/base_bert/MLM_base_bert':'question_answering',\n","               '/content/drive/My Drive/base_bert/QA_base_bert/base_bert_QA_Final':'question_answering'\n","               
}"],"execution_count":63,"outputs":[]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"O4_nFkNL69y3","executionInfo":{"status":"ok","timestamp":1632405512915,"user_tz":-210,"elapsed":28,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"7eeb1a3c-eb28-4c61-b1dd-a1e51a825c38"},"source":["cd /content/drive/My Drive/Squeeze/QA_Squeeze_Squad/squeeze-bert-squad-QA"],"execution_count":50,"outputs":[{"output_type":"stream","name":"stdout","text":["/content/drive/My Drive/Squeeze/QA_Squeeze_Squad/squeeze-bert-squad-QA\n"]}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"RbIc_B9k7GrI","executionInfo":{"status":"ok","timestamp":1632405512919,"user_tz":-210,"elapsed":21,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"3dd70b5b-2115-4bd8-90b5-1d5e955ed3f7"},"source":["cd /content/drive/My Drive/base_bert/QA_base_bert"],"execution_count":51,"outputs":[{"output_type":"stream","name":"stdout","text":["/content/drive/My Drive/base_bert/QA_base_bert\n"]}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"GOCF21al7BWn","executionInfo":{"status":"ok","timestamp":1632405513333,"user_tz":-210,"elapsed":22,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"5622db13-b470-4d79-a43e-16c2e1c9bd04"},"source":["!ls\n"],"execution_count":52,"outputs":[{"output_type":"stream","name":"stdout","text":["base_bert_QA_Final  base_bert_QA_final.zip\n"]}]},{"cell_type":"code","metadata":{"id":"8wi60ZiZLRT0","executionInfo":{"status":"ok","timestamp":1632405513763,"user_tz":-210,"elapsed":9,"user":{"displayName":"zahra 
nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":[
"class SentenceSimilarity():\n",
"    \"\"\"Mean-pooled sentence embeddings from a Hugging Face encoder, compared by cosine similarity.\n",
"\n",
"    Call `compute_label_embedding` with the candidate sentences first, then\n",
"    `similarity` with a query to score it against each of them.\n",
"    \"\"\"\n",
"\n",
"    def __init__(self, model_name=None, device='cuda'):\n",
"        \"\"\"Load tokenizer and encoder for `model_name`; run the encoder on `device`.\n",
"\n",
"        Falls back to the CPU when a CUDA device is requested but none is available.\n",
"        \"\"\"\n",
"        if str(device).startswith('cuda') and not torch.cuda.is_available():\n",
"            device = 'cpu'\n",
"        self.device = torch.device(device)\n",
"        self.tokenizer = AutoTokenizer.from_pretrained(model_name)\n",
"        self.model = AutoModel.from_pretrained(model_name).to(self.device).eval()\n",
"\n",
"    def __call__(self, text):\n",
"        \"\"\"Return the mean-pooled embedding of each input text.\"\"\"\n",
"        tokens = self.tokenizer(text, padding=True, return_tensors='pt', truncation=True).to(self.device)\n",
"        with torch.no_grad():\n",
"            embeddings = self.model(**tokens).last_hidden_state\n",
"\n",
"        # Zero out padding positions so they do not contribute to the average.\n",
"        mask = tokens['attention_mask'].unsqueeze(-1).expand(embeddings.shape).float()\n",
"        # The clamp keeps the division finite if a row has no unmasked tokens.\n",
"        return torch.sum(embeddings * mask, dim=1) / torch.clamp(mask.sum(1), min=1e-9)\n",
"\n",
"    def compute_label_embedding(self, labels):\n",
"        \"\"\"Embed `labels` and cache the result for later `similarity` calls.\"\"\"\n",
"        self.label_embeds = self(labels)\n",
"\n",
"    def similarity(self, example):\n",
"        \"\"\"Return the cosine similarity between `example` and each cached label embedding, as a list.\"\"\"\n",
"        return torch.cosine_similarity(self(example), self.label_embeds).tolist()"
],"execution_count":53,"outputs":[]},{"cell_type":"code","metadata":{"id":"VUPsEEr9LUFb","executionInfo":{"status":"ok","timestamp":1632405514712,"user_tz":-210,"elapsed":9,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":[
"def get_answer(sentences, question, model, model_type, n_top=None):\n",
"  \"\"\"Answer `question` from `sentences` with a similarity ranker or an extractive QA model.\n",
"\n",
"  'similarity': `model.similarity(question)` must return one score per sentence, in order;\n",
"  the `n_top` best-scoring sentences (all of them when `n_top` is None) are joined with spaces.\n",
"  'question_answering': the sentences are joined into one context and the 'answer' field\n",
"  of the model output is returned.\n",
"\n",
"  Raises ValueError for any other `model_type`.\n",
"  \"\"\"\n",
"  if model_type == 'similarity':\n",
"    scores = model.similarity(question)\n",
"    # Rank (sentence, score) pairs directly so a repeated sentence keeps its own score\n",
"    # instead of being collapsed into a single dictionary key.\n",
"    ranked = sorted(zip(sentences, scores), key=lambda pair: pair[1], reverse=True)\n",
"    return ' '.join(sentence for sentence, _ in ranked[:n_top])\n",
"\n",
"  if model_type == 'question_answering':\n",
"    context = ' '.join(sentences)\n",
"    return model(question=question, context=context)['answer']\n",
"\n",
"  raise ValueError('Unknown model_type: {!r}'.format(model_type))"
],"execution_count":54,"outputs":[]},{"cell_type":"code","metadata":{"id":"NW6RmKZGLcCf","executionInfo":{"status":"ok","timestamp":1632405515346,"user_tz":-210,"elapsed":9,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":[
"def get_score(token_reference, token_candidate, sf):\n",
"  \"\"\"Score one candidate answer against one reference answer.\n",
"\n",
"  `token_reference` and `token_candidate` are lists of word tokens; `sf` is the NLTK\n",
"  smoothing function handed to `sentence_bleu`.\n",
"  Returns (unigram BLEU, ROUGE-1 F, ROUGE-2 F, ROUGE-L F). ROUGE uses the notebook-level `rouge` scorer.\n",
"  NOTE(review): the scorers may raise on empty input - callers should be prepared for that.\n",
"  \"\"\"\n",
"  # sentence_bleu expects a list of references, each a list of tokens. Passing the bare\n",
"  # token list would make every single token count as a separate reference.\n",
"  bleu_score = sentence_bleu([token_reference], token_candidate, smoothing_function=sf, weights=(1, 0, 0, 0))\n",
"  # Build the ROUGE inputs from the arguments, not from notebook globals, so the function\n",
"  # always scores the pair it was given.\n",
"  rouge_score = rouge.get_scores(' '.join(token_candidate), ' '.join(token_reference))[0]\n",
"  return bleu_score, rouge_score['rouge-1']['f'], rouge_score['rouge-2']['f'], rouge_score['rouge-l']['f']"
],"execution_count":55,"outputs":[]},{"cell_type":"code","metadata":{"id":"Q07h24hZLesx","executionInfo":{"status":"ok","timestamp":1632405515797,"user_tz":-210,"elapsed":8,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":[
"def load_model(model_name, model_type):\n",
"  \"\"\"Build the model object that `get_answer` expects for `model_type`.\n",
"\n",
"  'similarity' -> SentenceSimilarity; 'question_answering' -> a transformers\n",
"  question-answering pipeline, placed on the first GPU when CUDA is available.\n",
"  Raises ValueError for any other `model_type`.\n",
"  \"\"\"\n",
"  if model_type == 'similarity':\n",
"    return SentenceSimilarity(model_name)\n",
"\n",
"  if model_type == 'question_answering':\n",
"    # NOTE(review): a checkpoint saved without a QA head gets a randomly initialised\n",
"    # `qa_outputs` layer here (transformers warns about it), so its answers are not meaningful.\n",
"    device = 0 if torch.cuda.is_available() else -1\n",
"    return pipeline(model=model_name, tokenizer=model_name, task='question-answering', device=device)\n",
"\n",
"  raise ValueError('Unknown model_type: {!r}'.format(model_type))"
],"execution_count":56,"outputs":[]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/","height":237},"id":"TYHoCqWyL3YO","executionInfo":{"status":"ok","timestamp":1632405516113,"user_tz":-210,"elapsed":14,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"b43bb064-c716-4daa-b0cd-e58ccc2780e1"},"source":["df = pd.DataFrame(columns=['Type', 'BLEU', 'ROUGE_1', 'ROUGE_2', 'ROUGE_l'], 
index=list(model_names.keys()))\n","df"],"execution_count":57,"outputs":[{"output_type":"execute_result","data":{"text/html":["<div>\n","<style scoped>\n","    .dataframe tbody tr th:only-of-type {\n","        vertical-align: middle;\n","    }\n","\n","    .dataframe tbody tr th {\n","        vertical-align: top;\n","    }\n","\n","    .dataframe thead th {\n","        text-align: right;\n","    }\n","</style>\n","<table border=\"1\" class=\"dataframe\">\n","  <thead>\n","    <tr style=\"text-align: right;\">\n","      <th></th>\n","      <th>Type</th>\n","      <th>BLEU</th>\n","      <th>ROUGE_1</th>\n","      <th>ROUGE_2</th>\n","      <th>ROUGE_l</th>\n","    </tr>\n","  </thead>\n","  <tbody>\n","    <tr>\n","      <th>/content/drive/My Drive/2_squeeze/Final_squeeze-squad</th>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","    </tr>\n","    <tr>\n","      <th>/content/drive/My Drive/2_squeeze/Squeeze-bert_MLM/MLM_output_dir/Final_squeeze_MLM</th>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","    </tr>\n","    <tr>\n","      <th>/content/drive/My Drive/Squeeze/QA_Squeeze_Squad/squeeze-bert-squad-QA</th>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","    </tr>\n","    <tr>\n","      <th>/content/drive/My Drive/base_bert/final_base_bert_QA_checkpoint</th>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","    </tr>\n","    <tr>\n","      <th>/content/drive/My Drive/base_bert/MLM_base_bert</th>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","    </tr>\n","    <tr>\n","      <th>/content/drive/My Drive/base_bert/QA_base_bert</th>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      
<td>NaN</td>\n","      <td>NaN</td>\n","    </tr>\n","  </tbody>\n","</table>\n","</div>"],"text/plain":["                                                   Type BLEU  ... ROUGE_2 ROUGE_l\n","/content/drive/My Drive/2_squeeze/Final_squeeze...  NaN  NaN  ...     NaN     NaN\n","/content/drive/My Drive/2_squeeze/Squeeze-bert_...  NaN  NaN  ...     NaN     NaN\n","/content/drive/My Drive/Squeeze/QA_Squeeze_Squa...  NaN  NaN  ...     NaN     NaN\n","/content/drive/My Drive/base_bert/final_base_be...  NaN  NaN  ...     NaN     NaN\n","/content/drive/My Drive/base_bert/MLM_base_bert     NaN  NaN  ...     NaN     NaN\n","/content/drive/My Drive/base_bert/QA_base_bert      NaN  NaN  ...     NaN     NaN\n","\n","[6 rows x 5 columns]"]},"metadata":{},"execution_count":57}]},{"cell_type":"code","metadata":{"id":"b0xLodKEScO3"},"source":["# import numpy as np\n","\n","# for data in qa['data']:\n","#   context = data['context']\n","#   doc = nlp(context)\n","#   print(\"*************\")\n","#   print(context)\n","#   print(\"*************\")\n","#   sentences = [str(sentence) for sentence in list(doc.sents)]\n","\n","#   if model_type == 'similarity':\n","#     model.compute_label_embedding(sentences)\n","  \n","#   for q_a in data['qas']:\n","#     question = q_a['question']\n","#     reference = \"\".join(q_a['answers'])\n","\n","#     # if type(question) == list:\n","#     #   question = q_a['question'][0]\n","#     print(\"##################\")\n","#     print(question)\n","\n","#   break"],"execution_count":null,"outputs":[]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"4mHGKWNaLhJn","executionInfo":{"status":"ok","timestamp":1632416928837,"user_tz":-210,"elapsed":3146763,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"cb0f95f0-a610-44ed-8f72-81ace75fe134"},"source":[
"# Evaluate every configured model on the QA set and store its mean BLEU / ROUGE in `df`.\n",
"for model_name in tqdm(model_names):\n",
"  model_type = model_names[model_name]\n",
"  # Write through .loc: chained df[col][row] assignment can land on a temporary copy and\n",
"  # does not add a row to df when model_name is missing from the index.\n",
"  df.loc[model_name, 'Type'] = model_type\n",
"\n",
"  model = load_model(model_name, model_type)\n",
"\n",
"  # Fresh score lists per model: reusing the lists across iterations would make every\n",
"  # average after the first one include the previous models' scores as well.\n",
"  bleu_scores, rouge1_scores, rouge2_scores, rougel_scores = [], [], [], []\n",
"  n_skipped = 0\n",
"\n",
"  for data in qa['data']:\n",
"    context = data['context']\n",
"    doc = nlp(context)\n",
"    sentences = [str(sentence) for sentence in doc.sents]\n",
"\n",
"    if model_type == 'similarity':\n",
"      model.compute_label_embedding(sentences)\n",
"\n",
"    for q_a in data['qas']:\n",
"      question = q_a['question']\n",
"      if isinstance(question, list):\n",
"        question = question[0]\n",
"\n",
"      # Separate multiple answer strings with a space; joining on '' glues the last word\n",
"      # of one answer to the first word of the next (e.g. 'old.Some').\n",
"      answers = q_a['answers']\n",
"      reference = answers if isinstance(answers, str) else ' '.join(answers)\n",
"\n",
"      candidate = get_answer(sentences, question, model, model_type, n_top)\n",
"      token_reference = nltk.word_tokenize(reference)\n",
"      token_candidate = nltk.word_tokenize(candidate)\n",
"\n",
"      try:\n",
"        bleu_score, rouge1_score, rouge2_score, rougel_score = get_score(\n",
"            token_reference, token_candidate, smoothie)\n",
"      except Exception:\n",
"        # Still best effort (one unscorable pair must not abort a long run), but the skip is\n",
"        # counted and reported, and KeyboardInterrupt is no longer swallowed.\n",
"        n_skipped += 1\n",
"        continue\n",
"\n",
"      bleu_scores.append(bleu_score)\n",
"      rouge1_scores.append(rouge1_score)\n",
"      rouge2_scores.append(rouge2_score)\n",
"      rougel_scores.append(rougel_score)\n",
"\n",
"  if n_skipped:\n",
"    tqdm.write('{}: skipped {} question(s) that could not be scored'.format(model_name, n_skipped))\n",
"\n",
"  # With no scored pairs the metric cells stay NaN instead of raising ZeroDivisionError.\n",
"  if bleu_scores:\n",
"    df.loc[model_name, 'BLEU'] = sum(bleu_scores) / len(bleu_scores)\n",
"    df.loc[model_name, 'ROUGE_1'] = sum(rouge1_scores) / len(rouge1_scores)\n",
"    df.loc[model_name, 'ROUGE_2'] = sum(rouge2_scores) / len(rouge2_scores)\n",
"    df.loc[model_name, 'ROUGE_l'] = sum(rougel_scores) / len(rougel_scores)"
],"execution_count":85,"outputs":[{"output_type":"stream","name":"stderr","text":[" 17%|█▋        | 1/6 [06:42<33:34, 402.89s/it]Some weights of the model checkpoint at /content/drive/My Drive/2_squeeze/Squeeze-bert_MLM/MLM_output_dir/Final_squeeze_MLM were not used when initializing SqueezeBertForQuestionAnswering: ['cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 
'cls.predictions.decoder.bias', 'cls.predictions.transform.dense.bias']\n","- This IS expected if you are initializing SqueezeBertForQuestionAnswering from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n","- This IS NOT expected if you are initializing SqueezeBertForQuestionAnswering from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n","Some weights of SqueezeBertForQuestionAnswering were not initialized from the model checkpoint at /content/drive/My Drive/2_squeeze/Squeeze-bert_MLM/MLM_output_dir/Final_squeeze_MLM and are newly initialized: ['qa_outputs.weight', 'qa_outputs.bias']\n","You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n"," 67%|██████▋   | 4/6 [30:50<16:37, 498.65s/it]Some weights of the model checkpoint at /content/drive/My Drive/base_bert/MLM_base_bert were not used when initializing BertForQuestionAnswering: ['cls.predictions.transform.dense.weight', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.weight', 'cls.predictions.decoder.bias', 'cls.predictions.transform.dense.bias']\n","- This IS expected if you are initializing BertForQuestionAnswering from the checkpoint of a model trained on another task or with another architecture (e.g. 
initializing a BertForSequenceClassification model from a BertForPreTraining model).\n","- This IS NOT expected if you are initializing BertForQuestionAnswering from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n","Some weights of BertForQuestionAnswering were not initialized from the model checkpoint at /content/drive/My Drive/base_bert/MLM_base_bert and are newly initialized: ['qa_outputs.weight', 'qa_outputs.bias']\n","You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n","100%|██████████| 6/6 [52:25<00:00, 524.31s/it]\n"]}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"r-mdMYlmueV2","executionInfo":{"status":"ok","timestamp":1632418553204,"user_tz":-210,"elapsed":442,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"a95d53cd-f5f4-4208-8319-b7941831b412"},"source":["sum(bleu_scores)/len(bleu_scores)"],"execution_count":103,"outputs":[{"output_type":"execute_result","data":{"text/plain":["0.05994253804045497"]},"metadata":{},"execution_count":103}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"IA1feYAzR_Ps","executionInfo":{"status":"ok","timestamp":1632411062312,"user_tz":-210,"elapsed":549,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"d41fdc40-921f-43f4-ac4c-41d97fb8e0da"},"source":["cd /content/drive/My Drive/base_bert/QA_base_bert"],"execution_count":61,"outputs":[{"output_type":"stream","name":"stdout","text":["/content/drive/My 
Drive/base_bert/QA_base_bert\n"]}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"_43eg3ZkSBUi","executionInfo":{"status":"ok","timestamp":1632411068044,"user_tz":-210,"elapsed":519,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"a95dff10-ce7b-45bb-83c5-23ac3c917a87"},"source":["!ls"],"execution_count":62,"outputs":[{"output_type":"stream","name":"stdout","text":["base_bert_QA_Final  base_bert_QA_final.zip\n"]}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"9s6L9SbtrzG6","executionInfo":{"status":"ok","timestamp":1632417629132,"user_tz":-210,"elapsed":482,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"22d0ea41-3840-4ff8-a831-fc1624d057d8"},"source":["print(token_reference)"],"execution_count":86,"outputs":[{"output_type":"stream","name":"stdout","text":["['Metformin', 'should', 'not', 'be', 'given', 'to', 'a', 'child', 'younger', 'than', '10', 'years', 'old.Some', 'forms', 'of', 'metformin', 'are', 'not', 'approved', 'for', 'use', 'by', 'anyone', 'younger', 'than', '18', 'years', 'old', '.']\n"]}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"_U4TxAy7r6Uh","executionInfo":{"status":"ok","timestamp":1632417629667,"user_tz":-210,"elapsed":15,"user":{"displayName":"zahra 
nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"54fe61a4-217a-4c5b-cfa5-a8041c6b1bf4"},"source":["token_candidate"],"execution_count":87,"outputs":[{"output_type":"execute_result","data":{"text/plain":["['10']"]},"metadata":{},"execution_count":87}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"KvuP3F2xw7sG","executionInfo":{"status":"ok","timestamp":1632419203620,"user_tz":-210,"elapsed":449,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"fe92b165-682d-4a5d-fb04-ac672768069e"},"source":["df.columns"],"execution_count":109,"outputs":[{"output_type":"execute_result","data":{"text/plain":["Index(['Unnamed: 0', 'Type', 'BLEU', 'ROUGE_1', 'ROUGE_2', 'ROUGE_l'], dtype='object')"]},"metadata":{},"execution_count":109}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"GKkwvQccxIB2","executionInfo":{"status":"ok","timestamp":1632419401520,"user_tz":-210,"elapsed":436,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"ccbf1ca3-1dd6-4397-f016-9fced27ffcbc"},"source":["df['Unnamed: 0'][0],df['BLEU'][0],  df['ROUGE_1'][0], df['ROUGE_2'][0], df['ROUGE_l'][0]"],"execution_count":115,"outputs":[{"output_type":"execute_result","data":{"text/plain":["('/content/drive/My Drive/2_squeeze/Final_squeeze-squad',\n"," 0.045835349004110466,\n"," 0.19854756525977146,\n"," 0.14850040140960274,\n"," 0.19770246399303446)"]},"metadata":{},"execution_count":115}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"H_ueotwEwkfN","executionInfo":{"status":"ok","timestamp":1632419452165,"user_tz":-210,"elapsed":24,"user":{"displayName":"zahra 
nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"b065aa4d-7e6a-4a65-e4f1-37007906b3b7"},"source":["df['Unnamed: 0'][1],df['BLEU'][1],  df['ROUGE_1'][1], df['ROUGE_2'][1], df['ROUGE_l'][1]"],"execution_count":116,"outputs":[{"output_type":"execute_result","data":{"text/plain":["('/content/drive/My Drive/2_squeeze/Squeeze-bert_MLM/MLM_output_dir/Final_squeeze_MLM',\n"," 0.047861168051024916,\n"," 0.17696092711645833,\n"," 0.12715152845920613,\n"," 0.17566550960893856)"]},"metadata":{},"execution_count":116}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"NpXeMk5qyDdU","executionInfo":{"status":"ok","timestamp":1632419476306,"user_tz":-210,"elapsed":452,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"74f2b786-c496-4156-a31b-3972cb624934"},"source":["df['Unnamed: 0'][2],df['BLEU'][2],  df['ROUGE_1'][2], df['ROUGE_2'][2], df['ROUGE_l'][2]"],"execution_count":117,"outputs":[{"output_type":"execute_result","data":{"text/plain":["('/content/drive/My Drive/Squeeze/QA_Squeeze_Squad/squeeze-bert-squad-QA',\n"," 0.04644906514503649,\n"," 0.18316448434589336,\n"," 0.133588030588075,\n"," 0.18208277306962864)"]},"metadata":{},"execution_count":117}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"Nbd8wXrryHph","executionInfo":{"status":"ok","timestamp":1632419492152,"user_tz":-210,"elapsed":517,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"e1662d33-807f-4535-c777-a490b40a0936"},"source":["df['Unnamed: 0'][3],df['BLEU'][3],  df['ROUGE_1'][3], df['ROUGE_2'][3], df['ROUGE_l'][3]"],"execution_count":118,"outputs":[{"output_type":"execute_result","data":{"text/plain":["('/content/drive/My 
Drive/base_bert/final_base_bert_QA_checkpoint',\n"," 0.051796216153443916,\n"," 0.2225680806645339,\n"," 0.17216889426750046,\n"," 0.22153564830299854)"]},"metadata":{},"execution_count":118}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"VJDkp_lTyMEI","executionInfo":{"status":"ok","timestamp":1632419508863,"user_tz":-210,"elapsed":465,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"82d129eb-a911-4e8e-f6ed-1eed170a7cd2"},"source":["df['Unnamed: 0'][4],df['BLEU'][4],  df['ROUGE_1'][4], df['ROUGE_2'][4], df['ROUGE_l'][4]"],"execution_count":119,"outputs":[{"output_type":"execute_result","data":{"text/plain":["('/content/drive/My Drive/base_bert/MLM_base_bert',\n"," 0.0623308143722647,\n"," 0.20567073421978976,\n"," 0.15514268988697952,\n"," 0.204525759253429)"]},"metadata":{},"execution_count":119}]},{"cell_type":"markdown","metadata":{"id":"WX5ytzRqD10j"},"source":["```\n"," Model name:  Final_squeeze-squad\n"," Bleu Scores:  0.045835349004110466,\n"," Rouge_1 Scores average 0.19854756525977146,\n"," Rouge_2 Scores average 0.14850040140960274,\n"," Rouge_l Scores average 0.19770246399303446\n","```\n","--- \n","```\n"," Model name:   Final_squeeze_MLM\n"," Bleu Scores:  0.047861168051024916,\n"," Rouge_1 Scores average 0.17696092711645833,\n"," Rouge_2 Scores average 0.12715152845920613,\n"," Rouge_l Scores average 0.17566550960893856\n","  \n","```\n","---  \n","```\n"," Model name:  squeeze-bert-squad-QA\n"," Bleu Scores:  0.04644906514503649,\n"," Rouge_1 Scores average 0.18316448434589336,\n"," Rouge_2 Scores average  0.133588030588075,\n"," Rouge_l Scores average 0.18208277306962864\n","```\n","---\n","``` \n"," Model name:  final_base_bert_QA_checkpoint\n"," Bleu Scores:  0.051796216153443916,\n"," Rouge_1 Scores average  0.2225680806645339,\n"," Rouge_2 Scores average  0.17216889426750046,\n"," Rouge_l Scores average  
0.22153564830299854\n","```\n","---\n","``` \n"," Model name:  MLM_base_bert\n"," Bleu Scores:  0.0623308143722647,\n"," Rouge_1 Scores average  0.20567073421978976,\n"," Rouge_2 Scores average  0.15514268988697952,\n"," Rouge_l Scores average  0.204525759253429\n","```\n","---\n"]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/","height":272},"id":"Pf2xpu1oLxiH","executionInfo":{"status":"ok","timestamp":1632417650717,"user_tz":-210,"elapsed":487,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"57035753-4957-4fcd-9c81-1c63712446b6"},"source":["df"],"execution_count":88,"outputs":[{"output_type":"execute_result","data":{"text/html":["<div>\n","<style scoped>\n","    .dataframe tbody tr th:only-of-type {\n","        vertical-align: middle;\n","    }\n","\n","    .dataframe tbody tr th {\n","        vertical-align: top;\n","    }\n","\n","    .dataframe thead th {\n","        text-align: right;\n","    }\n","</style>\n","<table border=\"1\" class=\"dataframe\">\n","  <thead>\n","    <tr style=\"text-align: right;\">\n","      <th></th>\n","      <th>Type</th>\n","      <th>BLEU</th>\n","      <th>ROUGE_1</th>\n","      <th>ROUGE_2</th>\n","      <th>ROUGE_l</th>\n","    </tr>\n","  </thead>\n","  <tbody>\n","    <tr>\n","      <th>/content/drive/My Drive/2_squeeze/Final_squeeze-squad</th>\n","      <td>question_answering</td>\n","      <td>0.0458353</td>\n","      <td>0.198548</td>\n","      <td>0.1485</td>\n","      <td>0.197702</td>\n","    </tr>\n","    <tr>\n","      <th>/content/drive/My Drive/2_squeeze/Squeeze-bert_MLM/MLM_output_dir/Final_squeeze_MLM</th>\n","      <td>question_answering</td>\n","      <td>0.0478612</td>\n","      <td>0.176961</td>\n","      <td>0.127152</td>\n","      <td>0.175666</td>\n","    </tr>\n","    <tr>\n","      <th>/content/drive/My Drive/Squeeze/QA_Squeeze_Squad/squeeze-bert-squad-QA</th>\n","      
<td>question_answering</td>\n","      <td>0.0464491</td>\n","      <td>0.183164</td>\n","      <td>0.133588</td>\n","      <td>0.182083</td>\n","    </tr>\n","    <tr>\n","      <th>/content/drive/My Drive/base_bert/final_base_bert_QA_checkpoint</th>\n","      <td>question_answering</td>\n","      <td>0.0517962</td>\n","      <td>0.222568</td>\n","      <td>0.172169</td>\n","      <td>0.221536</td>\n","    </tr>\n","    <tr>\n","      <th>/content/drive/My Drive/base_bert/MLM_base_bert</th>\n","      <td>question_answering</td>\n","      <td>0.0623308</td>\n","      <td>0.205671</td>\n","      <td>0.155143</td>\n","      <td>0.204526</td>\n","    </tr>\n","    <tr>\n","      <th>/content/drive/My Drive/base_bert/QA_base_bert</th>\n","      <td>question_answering</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","    </tr>\n","  </tbody>\n","</table>\n","</div>"],"text/plain":["                                                                  Type  ...   ROUGE_l\n","/content/drive/My Drive/2_squeeze/Final_squeeze...  question_answering  ...  0.197702\n","/content/drive/My Drive/2_squeeze/Squeeze-bert_...  question_answering  ...  0.175666\n","/content/drive/My Drive/Squeeze/QA_Squeeze_Squa...  question_answering  ...  0.182083\n","/content/drive/My Drive/base_bert/final_base_be...  question_answering  ...  0.221536\n","/content/drive/My Drive/base_bert/MLM_base_bert     question_answering  ...  0.204526\n","/content/drive/My Drive/base_bert/QA_base_bert      question_answering  ...       
NaN\n","\n","[6 rows x 5 columns]"]},"metadata":{},"execution_count":88}]},{"cell_type":"code","metadata":{"id":"xKU5BhiGQErn","executionInfo":{"status":"ok","timestamp":1632417801238,"user_tz":-210,"elapsed":999,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":["df.to_csv('qa_finetune_model.csv')"],"execution_count":89,"outputs":[]},{"cell_type":"code","metadata":{"id":"HGhoAqCPura2","executionInfo":{"status":"ok","timestamp":1632417808738,"user_tz":-210,"elapsed":469,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":["df = pd.read_csv('qa_finetune_model.csv')"],"execution_count":90,"outputs":[]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/","height":237},"id":"lLyCMD3evZxT","executionInfo":{"status":"ok","timestamp":1632417813427,"user_tz":-210,"elapsed":463,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"82bb34f5-de7e-48c7-8013-9d01378510c1"},"source":["df"],"execution_count":91,"outputs":[{"output_type":"execute_result","data":{"text/html":["<div>\n","<style scoped>\n","    .dataframe tbody tr th:only-of-type {\n","        vertical-align: middle;\n","    }\n","\n","    .dataframe tbody tr th {\n","        vertical-align: top;\n","    }\n","\n","    .dataframe thead th {\n","        text-align: right;\n","    }\n","</style>\n","<table border=\"1\" class=\"dataframe\">\n","  <thead>\n","    <tr style=\"text-align: right;\">\n","      <th></th>\n","      <th>Unnamed: 0</th>\n","      <th>Type</th>\n","      <th>BLEU</th>\n","      <th>ROUGE_1</th>\n","      <th>ROUGE_2</th>\n","      <th>ROUGE_l</th>\n","    </tr>\n","  </thead>\n","  <tbody>\n","    <tr>\n","      <th>0</th>\n","      <td>/content/drive/My 
Drive/2_squeeze/Final_squeez...</td>\n","      <td>question_answering</td>\n","      <td>0.045835</td>\n","      <td>0.198548</td>\n","      <td>0.148500</td>\n","      <td>0.197702</td>\n","    </tr>\n","    <tr>\n","      <th>1</th>\n","      <td>/content/drive/My Drive/2_squeeze/Squeeze-bert...</td>\n","      <td>question_answering</td>\n","      <td>0.047861</td>\n","      <td>0.176961</td>\n","      <td>0.127152</td>\n","      <td>0.175666</td>\n","    </tr>\n","    <tr>\n","      <th>2</th>\n","      <td>/content/drive/My Drive/Squeeze/QA_Squeeze_Squ...</td>\n","      <td>question_answering</td>\n","      <td>0.046449</td>\n","      <td>0.183164</td>\n","      <td>0.133588</td>\n","      <td>0.182083</td>\n","    </tr>\n","    <tr>\n","      <th>3</th>\n","      <td>/content/drive/My Drive/base_bert/final_base_b...</td>\n","      <td>question_answering</td>\n","      <td>0.051796</td>\n","      <td>0.222568</td>\n","      <td>0.172169</td>\n","      <td>0.221536</td>\n","    </tr>\n","    <tr>\n","      <th>4</th>\n","      <td>/content/drive/My Drive/base_bert/MLM_base_bert</td>\n","      <td>question_answering</td>\n","      <td>0.062331</td>\n","      <td>0.205671</td>\n","      <td>0.155143</td>\n","      <td>0.204526</td>\n","    </tr>\n","    <tr>\n","      <th>5</th>\n","      <td>/content/drive/My Drive/base_bert/QA_base_bert</td>\n","      <td>question_answering</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","      <td>NaN</td>\n","    </tr>\n","  </tbody>\n","</table>\n","</div>"],"text/plain":["                                          Unnamed: 0  ...   ROUGE_l\n","0  /content/drive/My Drive/2_squeeze/Final_squeez...  ...  0.197702\n","1  /content/drive/My Drive/2_squeeze/Squeeze-bert...  ...  0.175666\n","2  /content/drive/My Drive/Squeeze/QA_Squeeze_Squ...  ...  0.182083\n","3  /content/drive/My Drive/base_bert/final_base_b...  ...  0.221536\n","4    /content/drive/My Drive/base_bert/MLM_base_bert  ...  
0.204526\n","5     /content/drive/My Drive/base_bert/QA_base_bert  ...       NaN\n","\n","[6 rows x 6 columns]"]},"metadata":{},"execution_count":91}]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"6P-PK_r8OQQl","executionInfo":{"status":"ok","timestamp":1632417931425,"user_tz":-210,"elapsed":610,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"2bffab6c-f5d9-4fc2-c886-d09e030877a6"},"source":["# list(df.iloc[7:]['Unnamed: 0'])"],"execution_count":98,"outputs":[{"output_type":"execute_result","data":{"text/plain":["['/content/drive/My Drive/base_bert/final_base_bert_QA_checkpoint',\n"," '/content/drive/My Drive/base_bert/MLM_base_bert',\n"," '/content/drive/My Drive/base_bert/QA_base_bert']"]},"metadata":{},"execution_count":98}]},{"cell_type":"code","metadata":{"id":"_vAb9djfOLGi","executionInfo":{"status":"ok","timestamp":1632417857169,"user_tz":-210,"elapsed":538,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":["# index = list(df.iloc[7:]['Unnamed: 0'])"],"execution_count":93,"outputs":[]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/","height":481},"id":"Ys5wOUp_3p44","executionInfo":{"status":"ok","timestamp":1632417858942,"user_tz":-210,"elapsed":1253,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"6b26a40c-b5da-4dbe-c1a9-8d793f93e905"},"source":["df.iloc[:6].plot.bar(rot=0, subplots=True, figsize=(8, 6))"],"execution_count":94,"outputs":[{"output_type":"execute_result","data":{"text/plain":["array([<matplotlib.axes._subplots.AxesSubplot object at 0x7f600e1ee250>,\n","       <matplotlib.axes._subplots.AxesSubplot object at 0x7f6012335250>,\n","       <matplotlib.axes._subplots.AxesSubplot 
object at 0x7f600e1ee2d0>,\n","       <matplotlib.axes._subplots.AxesSubplot object at 0x7f6012375990>],\n","      dtype=object)"]},"metadata":{},"execution_count":94},{"output_type":"display_data","data":{"image/png":"\n","text/plain":["<Figure size 576x432 with 4 Axes>"]},"metadata":{"needs_background":"light"}}]},{"cell_type":"code","metadata":{"id":"j3I3FobLNgJ3","executionInfo":{"status":"ok","timestamp":1632417970633,"user_tz":-210,"elapsed":534,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}}},"source":["# df.iloc[7:].plot.bar(rot=0, subplots=True, figsize=(16, 8))"],"execution_count":99,"outputs":[]},{"cell_type":"code","metadata":{"colab":{"base_uri":"https://localhost:8080/","height":492},"id":"AsCAmTELQuf4","executionInfo":{"status":"ok","timestamp":1632417881917,"user_tz":-210,"elapsed":1419,"user":{"displayName":"zahra nafarieh","photoUrl":"https://lh3.googleusercontent.com/a/default-user=s64","userId":"05175754217722450138"}},"outputId":"1e650350-5275-40e2-eb61-d2baaaa5fcfa"},"source":["df.plot.bar(rot=0, subplots=True, figsize=(20, 8))"],"execution_count":96,"outputs":[{"output_type":"execute_result","data":{"text/plain":["array([<matplotlib.axes._subplots.AxesSubplot object at 0x7f600dcc2310>,\n","       <matplotlib.axes._subplots.AxesSubplot object at 0x7f600dc09910>,\n","       <matplotlib.axes._subplots.AxesSubplot object at 0x7f600dcc2d90>,\n","       <matplotlib.axes._subplots.AxesSubplot object at 0x7f600db790d0>],\n","      dtype=object)"]},"metadata":{},"execution_count":96},{"output_type":"display_data","data":{"image/png":"\n","text/plain":["<Figure size 1440x576 with 4 Axes>"]},"metadata":{"needs_background":"light"}}]},{"cell_type":"code","metadata":{"id":"balb23Y6Sh8v"},"source":[""],"execution_count":null,"outputs":[]}]}
\ No newline at end of file