diff --git a/ML/Pytorch/huggingface/.ipynb_checkpoints/Untitled-checkpoint.ipynb b/ML/Pytorch/huggingface/.ipynb_checkpoints/Untitled-checkpoint.ipynb
deleted file mode 100644
index 363fcab..0000000
--- a/ML/Pytorch/huggingface/.ipynb_checkpoints/Untitled-checkpoint.ipynb
+++ /dev/null
@@ -1,6 +0,0 @@
-{
- "cells": [],
- "metadata": {},
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/ML/Pytorch/huggingface/.ipynb_checkpoints/cnndaily_t5_lightning_customdataloading-checkpoint.ipynb b/ML/Pytorch/huggingface/.ipynb_checkpoints/cnndaily_t5_lightning_customdataloading-checkpoint.ipynb
deleted file mode 100644
index a3216e9..0000000
--- a/ML/Pytorch/huggingface/.ipynb_checkpoints/cnndaily_t5_lightning_customdataloading-checkpoint.ipynb
+++ /dev/null
@@ -1,317 +0,0 @@
-{
- "cells": [
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "f54ecf0b",
- "metadata": {},
- "outputs": [],
- "source": [
- "\"\"\"\n",
- "# HuggingFace Tutorial Series\n",
- "- 1. What is Huggingface?\n",
- "- 2. Common tasks we can do with HuggingFace & explain the tasks briefly, like what is question answering etc\n",
- "- 3. Using the HuggingFace Pipeline (High level feature)\n",
- "- 4. How the pipeline works at a lower level\n",
- "- 5. HuggingFace Datasets\n",
- "- 6. HuggingFace Tokenizer\n",
- "- 7. HuggingFace Evaluate\n",
- "- 8. HuggingFace Trainer\n",
- "- 9. Putting it together to finetune a news article summarizer\n",
- "- 10. Making it more general and robust with Lightning and custom data loading\n",
- "\"\"\""
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "ec1aae37",
- "metadata": {},
- "outputs": [],
- "source": [
- "import warnings\n",
- "warnings.simplefilter(\"ignore\")\n",
- "\n",
- "import os\n",
- "os.environ[\"CUDA_DEVICE_ORDER\"]=\"PCI_BUS_ID\"\n",
- "os.environ[\"CUDA_VISIBLE_DEVICES\"]=\"0\"\n",
- "\n",
- "import numpy as np\n",
- "import torch\n",
- "import datasets \n",
- "import pytorch_lightning as pl\n",
- "from datasets import load_dataset, load_metric\n",
- "\n",
- "from transformers import (\n",
- " AutoModel,\n",
- " AutoModelForSeq2SeqLM,\n",
- " AutoTokenizer,\n",
- " DataCollatorForSeq2Seq,\n",
- " Seq2SeqTrainingArguments,\n",
- " Seq2SeqTrainer,\n",
- ")\n",
- "\n",
- "import torch\n",
- "import pandas as pd\n",
- "from torch.utils.data import Dataset\n",
- "import pytorch_lightning as pl\n",
- "\n",
- "torch.set_float32_matmul_precision(\"medium\")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "5fd7cb0c",
- "metadata": {},
- "outputs": [],
- "source": [
- "model_name = \"t5-small\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "418cb03a",
- "metadata": {},
- "outputs": [],
- "source": [
- "class cnn_dailymail(Dataset):\n",
- " def __init__(self, csv_file, tokenizer, max_length=512):\n",
- " self.data = pd.read_csv(csv_file)\n",
- " self.tokenizer = tokenizer\n",
- " self.max_length = max_length\n",
- "\n",
- " def __len__(self):\n",
- " return len(self.data)\n",
- "\n",
- " def __getitem__(self, idx):\n",
- " article = self.data.loc[idx, 'article']\n",
- " highlights = self.data.loc[idx, 'highlights']\n",
- "\n",
- " inputs = self.tokenizer(\n",
- " article,\n",
- " truncation=True,\n",
- " padding='max_length',\n",
- " max_length=self.max_length,\n",
- " return_tensors='pt'\n",
- " )\n",
- " targets = self.tokenizer(\n",
- " highlights,\n",
- " truncation=True,\n",
- " padding='max_length',\n",
- " max_length=self.max_length,\n",
- " return_tensors='pt'\n",
- " )\n",
- "\n",
- " return {\n",
- " 'input_ids': inputs['input_ids'].squeeze(),\n",
- " 'attention_mask': inputs['attention_mask'].squeeze(),\n",
- " 'labels': targets['input_ids'].squeeze()\n",
- " }"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "aaa62755",
- "metadata": {},
- "outputs": [],
- "source": [
- "class MyDataModule(pl.LightningDataModule):\n",
- " def __init__(self, train_csv, val_csv, test_csv, tokenizer, batch_size=16, max_length=512):\n",
- " super().__init__()\n",
- " self.train_csv = train_csv\n",
- " self.val_csv = val_csv\n",
- " self.test_csv = test_csv\n",
- " self.tokenizer = tokenizer\n",
- " self.batch_size = batch_size\n",
- " self.max_length = max_length\n",
- "\n",
- " def setup(self, stage=None):\n",
- " if stage in ('fit', None):\n",
- " self.train_dataset = cnn_dailymail(self.train_csv, self.tokenizer, self.max_length)\n",
- " self.val_dataset = cnn_dailymail(self.val_csv, self.tokenizer, self.max_length)\n",
- " if stage in ('test', None):\n",
- " self.test_dataset = cnn_dailymail(self.test_csv, self.tokenizer, self.max_length)\n",
- "\n",
- " def train_dataloader(self):\n",
- " return torch.utils.data.DataLoader(self.train_dataset, batch_size=self.batch_size, shuffle=True, num_workers=4)\n",
- "\n",
- " def val_dataloader(self):\n",
- " return torch.utils.data.DataLoader(self.val_dataset, batch_size=self.batch_size, shuffle=False, num_workers=2)\n",
- "\n",
- " def test_dataloader(self):\n",
- " return torch.utils.data.DataLoader(self.test_dataset, batch_size=self.batch_size, shuffle=False, num_workers=2)\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "fbb699e1",
- "metadata": {},
- "outputs": [],
- "source": [
- "class MyLightningModule(pl.LightningModule):\n",
- " def __init__(self, model_name, learning_rate, weight_decay):\n",
- " super().__init__()\n",
- " self.model_name = model_name\n",
- " self.learning_rate = learning_rate\n",
- " self.weight_decay = weight_decay\n",
- " \n",
- " # Load the pre-trained model and tokenizer\n",
- " self.model = torch.compile(AutoModelForSeq2SeqLM.from_pretrained(self.model_name))\n",
- " \n",
- " # Load the ROUGE metric\n",
- " self.metric = load_metric(\"rouge\")\n",
- "\n",
- " def forward(self, input_ids, attention_mask, labels=None):\n",
- " output = self.model(\n",
- " input_ids=input_ids,\n",
- " attention_mask=attention_mask,\n",
- " labels=labels,\n",
- " )\n",
- " return output.loss, output.logits\n",
- " \n",
- " def training_step(self, batch, batch_idx):\n",
- " input_ids = batch[\"input_ids\"]\n",
- " attention_mask = batch[\"attention_mask\"]\n",
- " labels = batch[\"labels\"]\n",
- " loss, logits = self(input_ids, attention_mask, labels)\n",
- " self.log('train_loss', loss, on_epoch=True, on_step=True, prog_bar=True)\n",
- " return {'loss': loss, 'logits': logits}\n",
- " \n",
- " def validation_step(self, batch, batch_idx):\n",
- " input_ids = batch[\"input_ids\"]\n",
- " attention_mask = batch[\"attention_mask\"]\n",
- " labels = batch[\"labels\"]\n",
- " loss, logits = self(input_ids, attention_mask, labels)\n",
- " self.log('val_loss', loss, on_epoch=True, on_step=False)\n",
- " \n",
- " # Save logits and labels as instance attributes\n",
- " if not hasattr(self, \"logits\"):\n",
- " self.logits = logits\n",
- " else:\n",
- " self.logits = torch.cat((self.logits, logits), dim=0)\n",
- " \n",
- " if not hasattr(self, \"labels\"):\n",
- " self.labels = labels\n",
- " else:\n",
- " self.labels = torch.cat((self.labels, labels), dim=0)\n",
- " \n",
- " return {'loss': loss, 'logits': logits, \"labels\":labels}\n",
- " \n",
- " def on_validation_epoch_end(self):\n",
- " # Convert logits to predicted token IDs\n",
- " pred_token_ids = self.logits.argmax(dim=-1)\n",
- "\n",
- " # Decode predictions and labels using the saved instance attributes\n",
- " decoded_preds = tokenizer.batch_decode(pred_token_ids, skip_special_tokens=True)\n",
- " decoded_labels = tokenizer.batch_decode(self.labels, skip_special_tokens=True)\n",
- "\n",
- " # Compute ROUGE scores\n",
- " scores = self.metric.compute(predictions=decoded_preds, references=decoded_labels, rouge_types=[\"rouge1\"])[\"rouge1\"].mid\n",
- "\n",
- " self.log('rouge1_precision', scores.precision, prog_bar=True)\n",
- " self.log('rouge1_recall', scores.recall, prog_bar=True)\n",
- " self.log('rouge1_fmeasure', scores.fmeasure, prog_bar=True)\n",
- "\n",
- " # Clear logits and labels instance attributes for the next validation epoch\n",
- " del self.logits\n",
- " del self.labels\n",
- " \n",
- " def configure_optimizers(self):\n",
- " optimizer = torch.optim.AdamW(self.parameters(), lr=self.learning_rate, weight_decay=self.weight_decay)\n",
- " return optimizer\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "dd63c628",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "# File paths\n",
- "train_csv = \"train.csv\"\n",
- "val_csv = \"validation.csv\"\n",
- "test_csv = \"test.csv\"\n",
- "\n",
- "# Create the data module\n",
- "dm = MyDataModule(train_csv, val_csv, test_csv, tokenizer, batch_size=16)\n",
- "dm.setup()\n",
- "\n",
- "model = MyLightningModule(model_name=\"t5-small\", learning_rate=1e-4, weight_decay=1e-5)\n",
- "trainer = pl.Trainer(accelerator=\"gpu\", devices=[0], max_epochs=1, precision=16)\n",
- "trainer.fit(model, datamodule=dm)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "b5d3d684",
- "metadata": {},
- "outputs": [],
- "source": [
- "http://localhost:18888/notebooks/cnndaily_t5_lightning_customdataloading.ipynb"
- ]
- },
- {
- "cell_type": "markdown",
- "id": "a0494596",
- "metadata": {},
- "source": [
- "### next steps:\n",
- "* if article is > 512, because now we are truncating maybe it causes issues if the article is much longer?\n",
- "\n",
- "#### what we've done:\n",
- "* Change the data loading so it's more general, meaning on the fly loading from disk\n",
- "* add torch.compile\n",
- "* 1. Clean up the code, make it into scripts instead of notebook -> Train for an epoch (add multi-gpu training?)\n",
- "* add tensorboard visualization\n",
- "* not use pretrained weights but from scratch to ensure that training setup works and actually improving\n",
- "* 2. Create an inference step, send in news article -> get summary, check that it works\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "80a2efab",
- "metadata": {},
- "outputs": [],
- "source": []
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "0f9b71ab",
- "metadata": {},
- "outputs": [],
- "source": []
- }
- ],
- "metadata": {
- "kernelspec": {
- "display_name": "Python 3 (ipykernel)",
- "language": "python",
- "name": "python3"
- },
- "language_info": {
- "codemirror_mode": {
- "name": "ipython",
- "version": 3
- },
- "file_extension": ".py",
- "mimetype": "text/x-python",
- "name": "python",
- "nbconvert_exporter": "python",
- "pygments_lexer": "ipython3",
- "version": "3.10.9"
- }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/ML/Pytorch/huggingface/.ipynb_checkpoints/finetune_t5_lightning-checkpoint.ipynb b/ML/Pytorch/huggingface/.ipynb_checkpoints/finetune_t5_lightning-checkpoint.ipynb
deleted file mode 100644
index e3220a5..0000000
--- a/ML/Pytorch/huggingface/.ipynb_checkpoints/finetune_t5_lightning-checkpoint.ipynb
+++ /dev/null
@@ -1,463 +0,0 @@
-{
- "cells": [
- {
- "cell_type": "code",
- "execution_count": 2,
- "id": "ec1aae37",
- "metadata": {},
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "2023-02-21 16:36:20.707209: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA\n",
- "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
- "2023-02-21 16:36:21.233575: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory\n",
- "2023-02-21 16:36:21.233623: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory\n",
- "2023-02-21 16:36:21.233628: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly.\n"
- ]
- }
- ],
- "source": [
- "import warnings\n",
- "warnings.simplefilter(\"ignore\")\n",
- "\n",
- "import os\n",
- "os.environ[\"CUDA_DEVICE_ORDER\"]=\"PCI_BUS_ID\"\n",
- "os.environ[\"CUDA_VISIBLE_DEVICES\"]=\"1\"\n",
- "\n",
- "import numpy as np\n",
- "import torch\n",
- "\n",
- "import datasets \n",
- "import pytorch_lightning as pl\n",
- "\n",
- "from datasets import load_dataset, load_metric\n",
- "\n",
- "from transformers import (\n",
- " AutoModel,\n",
- " AutoModelForSeq2SeqLM,\n",
- " AutoTokenizer,\n",
- " DataCollatorForSeq2Seq,\n",
- " Seq2SeqTrainingArguments,\n",
- " Seq2SeqTrainer,\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 3,
- "id": "5fd7cb0c",
- "metadata": {},
- "outputs": [],
- "source": [
- "model_name = \"t5-small\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 4,
- "id": "04530b1e",
- "metadata": {},
- "outputs": [],
- "source": [
- "# Define the LightningDataModule\n",
- "class MyDataModule(pl.LightningDataModule):\n",
- " def __init__(self, batch_size):\n",
- " super().__init__()\n",
- " self.batch_size = batch_size\n",
- " \n",
- " def prepare_data(self):\n",
- " # Download and preprocess the data\n",
- " load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"train[:10%]\")\n",
- " load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"validation[:10%]\")\n",
- " \n",
- " def setup(self, stage=None):\n",
- " # Load and preprocess the data\n",
- " train_data = load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"train[:10%]\")\n",
- " val_data = load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"validation[:10%]\")\n",
- "\n",
- " self.train_ds = train_data.map(\n",
- " self.preprocess_function, \n",
- " batched=True, \n",
- " batch_size=self.batch_size, \n",
- " remove_columns=[\"article\", \"highlights\", \"id\"]\n",
- " )\n",
- "\n",
- " self.val_ds = val_data.map(\n",
- " self.preprocess_function, \n",
- " batched=True, \n",
- " batch_size=self.batch_size,\n",
- " remove_columns=[\"article\", \"highlights\", \"id\"]\n",
- " )\n",
- "\n",
- " def preprocess_function(self, batch):\n",
- " inputs = tokenizer(batch[\"article\"], padding=\"max_length\", truncation=True, max_length=512)\n",
- " outputs = tokenizer(batch[\"highlights\"], padding=\"max_length\", truncation=True, max_length=128)\n",
- " batch[\"input_ids\"] = inputs.input_ids\n",
- " batch[\"attention_mask\"] = inputs.attention_mask\n",
- " batch[\"labels\"] = outputs.input_ids.copy()\n",
- " return batch\n",
- "\n",
- " def train_dataloader(self):\n",
- " return torch.utils.data.DataLoader(self.train_ds, batch_size=self.batch_size)\n",
- "\n",
- " def val_dataloader(self):\n",
- " return torch.utils.data.DataLoader(self.val_ds, batch_size=self.batch_size)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 7,
- "id": "fbb699e1",
- "metadata": {},
- "outputs": [],
- "source": [
- "class MyLightningModule(pl.LightningModule):\n",
- " def __init__(self, model_name, learning_rate, weight_decay, batch_size):\n",
- " super().__init__()\n",
- " self.model_name = model_name\n",
- " self.learning_rate = learning_rate\n",
- " self.weight_decay = weight_decay\n",
- " self.batch_size = batch_size\n",
- " \n",
- " # Load the pre-trained model and tokenizer\n",
- " self.model = AutoModelForSeq2SeqLM.from_pretrained(self.model_name)\n",
- "\n",
- " # Load the ROUGE metric\n",
- " self.metric = load_metric(\"rouge\")\n",
- "\n",
- " def forward(self, input_ids, attention_mask, labels=None):\n",
- " output = self.model(\n",
- " input_ids=input_ids,\n",
- " attention_mask=attention_mask,\n",
- " labels=labels,\n",
- " )\n",
- " return output.loss, output.logits\n",
- " \n",
- " def training_step(self, batch, batch_idx):\n",
- " input_ids = batch[\"input_ids\"]\n",
- " attention_mask = batch[\"attention_mask\"]\n",
- " labels = batch[\"labels\"]\n",
- " loss, logits = self(input_ids, attention_mask, labels)\n",
- " self.log('train_loss', loss, on_epoch=True, on_step=False)\n",
- " return {'loss': loss, 'logits': logits}\n",
- " \n",
- " def validation_step(self, batch, batch_idx):\n",
- " input_ids = batch[\"input_ids\"]\n",
- " attention_mask = batch[\"attention_mask\"]\n",
- " labels = batch[\"labels\"]\n",
- " loss, logits = self(input_ids, attention_mask, labels)\n",
- " self.log('val_loss', loss, on_epoch=True, on_step=False)\n",
- " return {'loss': loss, 'logits': logits, \"labels\":labels}\n",
- " \n",
- " def validation_epoch_end(self, outputs):\n",
- " decoded_preds = []\n",
- " decoded_labels = []\n",
- " for output in outputs:\n",
- " logits = output['logits']\n",
- " labels = output['labels']\n",
- " decoded_preds += self.tokenizer.batch_decode(logits, skip_special_tokens=True)\n",
- " decoded_labels += self.tokenizer.batch_decode(labels, skip_special_tokens=True)\n",
- " \n",
- " scores = self.metric.compute(predictions=decoded_preds, references=decoded_labels, rouge_types=[\"rouge1\"])[\"rouge1\"].mid\n",
- " \n",
- " self.log('rouge1_precision', scores.precision, prog_bar=True)\n",
- " self.log('rouge1_recall', scores.recall, prog_bar=True)\n",
- " self.log('rouge1_fmeasure', scores.fmeasure, prog_bar=True)\n",
- " \n",
- " def configure_optimizers(self):\n",
- " optimizer = torch.optim.AdamW(self.parameters(), lr=self.learning_rate, weight_decay=self.weight_decay)\n",
- " return optimizer\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 8,
- "id": "dd63c628",
- "metadata": {
- "scrolled": false
- },
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "GPU available: True (cuda), used: True\n",
- "TPU available: False, using: 0 TPU cores\n",
- "IPU available: False, using: 0 IPUs\n",
- "HPU available: False, using: 0 HPUs\n",
- "Found cached dataset cnn_dailymail (/home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de)\n",
- "Found cached dataset cnn_dailymail (/home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de)\n",
- "Found cached dataset cnn_dailymail (/home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de)\n",
- "Found cached dataset cnn_dailymail (/home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de)\n",
- "\n",
- " 0%| | 0/1795 [00:00, ?ba/s]\u001b[A\n",
- " 1%|▉ | 13/1795 [00:00<00:14, 121.44ba/s]\u001b[A\n",
- " 1%|█▉ | 26/1795 [00:00<00:15, 117.31ba/s]\u001b[A\n",
- " 2%|██▊ | 38/1795 [00:00<00:15, 114.50ba/s]\u001b[A\n",
- " 3%|███▋ | 50/1795 [00:00<00:15, 114.43ba/s]\u001b[A\n",
- " 3%|████▌ | 62/1795 [00:00<00:15, 115.53ba/s]\u001b[A\n",
- " 4%|█████▍ | 74/1795 [00:00<00:15, 113.50ba/s]\u001b[A\n",
- " 5%|██████▎ | 86/1795 [00:00<00:15, 111.92ba/s]\u001b[A\n",
- " 5%|███████▎ | 98/1795 [00:00<00:15, 111.38ba/s]\u001b[A\n",
- " 6%|████████ | 110/1795 [00:00<00:15, 112.08ba/s]\u001b[A\n",
- " 7%|████████▉ | 122/1795 [00:01<00:14, 113.73ba/s]\u001b[A\n",
- " 7%|█████████▊ | 134/1795 [00:01<00:14, 113.43ba/s]\u001b[A\n",
- " 8%|██████████▋ | 146/1795 [00:01<00:14, 111.37ba/s]\u001b[A\n",
- " 9%|███████████▌ | 158/1795 [00:01<00:14, 111.32ba/s]\u001b[A\n",
- " 9%|████████████▌ | 170/1795 [00:01<00:14, 110.29ba/s]\u001b[A\n",
- " 10%|█████████████▍ | 182/1795 [00:01<00:14, 110.06ba/s]\u001b[A\n",
- " 11%|██████████████▎ | 194/1795 [00:01<00:14, 111.06ba/s]\u001b[A\n",
- " 11%|███████████████▏ | 206/1795 [00:01<00:14, 111.15ba/s]\u001b[A\n",
- " 12%|████████████████ | 218/1795 [00:01<00:14, 110.27ba/s]\u001b[A\n",
- " 13%|████████████████▉ | 230/1795 [00:02<00:14, 109.17ba/s]\u001b[A\n",
- " 13%|█████████████████▋ | 241/1795 [00:02<00:14, 107.81ba/s]\u001b[A\n",
- " 14%|██████████████████▌ | 252/1795 [00:02<00:14, 107.84ba/s]\u001b[A\n",
- " 15%|███████████████████▎ | 263/1795 [00:02<00:14, 107.73ba/s]\u001b[A\n",
- " 15%|████████████████████▏ | 274/1795 [00:02<00:14, 107.06ba/s]\u001b[A\n",
- " 16%|█████████████████████ | 286/1795 [00:02<00:13, 108.37ba/s]\u001b[A\n",
- " 17%|█████████████████████▊ | 297/1795 [00:02<00:13, 107.89ba/s]\u001b[A\n",
- " 17%|██████████████████████▋ | 309/1795 [00:02<00:13, 108.63ba/s]\u001b[A\n",
- " 18%|███████████████████████▌ | 320/1795 [00:02<00:13, 106.85ba/s]\u001b[A\n",
- " 18%|████████████████████████▎ | 331/1795 [00:03<00:13, 105.16ba/s]\u001b[A\n",
- " 19%|█████████████████████████▏ | 342/1795 [00:03<00:13, 105.20ba/s]\u001b[A\n",
- " 20%|█████████████████████████▉ | 353/1795 [00:03<00:13, 106.52ba/s]\u001b[A\n",
- " 20%|██████████████████████████▊ | 364/1795 [00:03<00:13, 106.07ba/s]\u001b[A\n",
- " 21%|███████████████████████████▌ | 375/1795 [00:03<00:13, 106.21ba/s]\u001b[A\n",
- " 22%|████████████████████████████▍ | 386/1795 [00:03<00:13, 106.57ba/s]\u001b[A\n",
- " 22%|█████████████████████████████▎ | 398/1795 [00:03<00:12, 108.52ba/s]\u001b[A\n",
- " 23%|██████████████████████████████ | 409/1795 [00:03<00:12, 108.42ba/s]\u001b[A\n",
- " 23%|██████████████████████████████▉ | 421/1795 [00:03<00:12, 110.30ba/s]\u001b[A\n",
- " 24%|███████████████████████████████▊ | 433/1795 [00:03<00:12, 108.73ba/s]\u001b[A\n",
- " 25%|████████████████████████████████▋ | 444/1795 [00:04<00:12, 106.43ba/s]\u001b[A\n",
- " 25%|█████████████████████████████████▍ | 455/1795 [00:04<00:12, 106.82ba/s]\u001b[A\n",
- " 26%|██████████████████████████████████▎ | 466/1795 [00:04<00:12, 105.85ba/s]\u001b[A\n",
- " 27%|███████████████████████████████████ | 477/1795 [00:04<00:12, 107.02ba/s]\u001b[A\n",
- " 27%|███████████████████████████████████▉ | 488/1795 [00:04<00:12, 106.66ba/s]\u001b[A\n",
- " 28%|████████████████████████████████████▊ | 500/1795 [00:04<00:11, 108.59ba/s]\u001b[A\n",
- " 28%|█████████████████████████████████████▌ | 511/1795 [00:04<00:12, 106.49ba/s]\u001b[A\n",
- " 29%|██████████████████████████████████████▍ | 523/1795 [00:04<00:11, 109.26ba/s]\u001b[A\n",
- " 30%|███████████████████████████████████████▎ | 535/1795 [00:04<00:11, 109.78ba/s]\u001b[A\n",
- " 30%|████████████████████████████████████████▏ | 546/1795 [00:04<00:11, 108.30ba/s]\u001b[A\n",
- " 31%|████████████████████████████████████████▉ | 557/1795 [00:05<00:11, 107.77ba/s]\u001b[A\n",
- " 32%|█████████████████████████████████████████▊ | 569/1795 [00:05<00:11, 108.36ba/s]\u001b[A\n",
- " 32%|██████████████████████████████████████████▋ | 580/1795 [00:05<00:11, 107.05ba/s]\u001b[A\n",
- " 33%|███████████████████████████████████████████▌ | 592/1795 [00:05<00:11, 108.48ba/s]\u001b[A\n",
- " 34%|████████████████████████████████████████████▎ | 603/1795 [00:05<00:11, 108.25ba/s]\u001b[A\n",
- " 34%|█████████████████████████████████████████████▏ | 615/1795 [00:05<00:10, 110.59ba/s]\u001b[A\n",
- " 35%|██████████████████████████████████████████████ | 627/1795 [00:05<00:10, 111.44ba/s]\u001b[A\n",
- " 36%|██████████████████████████████████████████████▉ | 639/1795 [00:05<00:10, 109.07ba/s]\u001b[A\n",
- " 36%|███████████████████████████████████████████████▊ | 651/1795 [00:05<00:10, 109.77ba/s]\u001b[A\n",
- " 37%|████████████████████████████████████████████████▋ | 662/1795 [00:06<00:10, 109.69ba/s]\u001b[A\n",
- " 37%|█████████████████████████████████████████████████▍ | 673/1795 [00:06<00:10, 109.08ba/s]\u001b[A\n",
- " 38%|██████████████████████████████████████████████████▎ | 685/1795 [00:06<00:10, 109.77ba/s]\u001b[A\n",
- " 39%|███████████████████████████████████████████████████▎ | 697/1795 [00:06<00:10, 109.54ba/s]\u001b[A\n",
- " 39%|████████████████████████████████████████████████████ | 708/1795 [00:06<00:09, 109.08ba/s]\u001b[A\n",
- " 40%|████████████████████████████████████████████████████▉ | 720/1795 [00:06<00:09, 110.53ba/s]\u001b[A\n",
- " 41%|█████████████████████████████████████████████████████▊ | 732/1795 [00:06<00:09, 108.30ba/s]\u001b[A\n",
- " 41%|██████████████████████████████████████████████████████▋ | 744/1795 [00:06<00:09, 110.04ba/s]\u001b[A\n",
- " 42%|███████████████████████████████████████████████████████▌ | 756/1795 [00:06<00:09, 112.10ba/s]\u001b[A\n",
- " 43%|████████████████████████████████████████████████████████▍ | 768/1795 [00:07<00:09, 111.21ba/s]\u001b[A\n",
- " 43%|█████████████████████████████████████████████████████████▎ | 780/1795 [00:07<00:09, 111.99ba/s]\u001b[A\n",
- " 44%|██████████████████████████████████████████████████████████▏ | 792/1795 [00:07<00:08, 112.21ba/s]\u001b[A\n",
- " 45%|███████████████████████████████████████████████████████████ | 804/1795 [00:07<00:09, 109.31ba/s]\u001b[A\n",
- " 46%|████████████████████████████████████████████████████████████ | 817/1795 [00:07<00:08, 113.17ba/s]\u001b[A\n",
- " 46%|████████████████████████████████████████████████████████████▉ | 829/1795 [00:07<00:08, 113.26ba/s]\u001b[A\n",
- " 47%|█████████████████████████████████████████████████████████████▊ | 841/1795 [00:07<00:08, 113.69ba/s]\u001b[A\n",
- " 48%|██████████████████████████████████████████████████████████████▋ | 853/1795 [00:07<00:08, 114.08ba/s]\u001b[A\n",
- " 48%|███████████████████████████████████████████████████████████████▌ | 865/1795 [00:07<00:08, 112.82ba/s]\u001b[A\n",
- " 49%|████████████████████████████████████████████████████████████████▍ | 877/1795 [00:07<00:08, 113.22ba/s]\u001b[A\n",
- " 50%|█████████████████████████████████████████████████████████████████▍ | 890/1795 [00:08<00:07, 115.71ba/s]\u001b[A\n",
- " 50%|██████████████████████████████████████████████████████████████████▎ | 902/1795 [00:08<00:07, 115.77ba/s]\u001b[A\n",
- " 51%|███████████████████████████████████████████████████████████████████▏ | 914/1795 [00:08<00:07, 114.07ba/s]\u001b[A\n",
- " 52%|████████████████████████████████████████████████████████████████████ | 926/1795 [00:08<00:07, 114.19ba/s]\u001b[A\n",
- " 52%|████████████████████████████████████████████████████████████████████▉ | 938/1795 [00:08<00:07, 115.57ba/s]\u001b[A\n",
- " 53%|█████████████████████████████████████████████████████████████████████▊ | 950/1795 [00:08<00:07, 115.94ba/s]\u001b[A\n",
- " 54%|██████████████████████████████████████████████████████████████████████▋ | 962/1795 [00:08<00:07, 116.65ba/s]\u001b[A\n",
- " 54%|███████████████████████████████████████████████████████████████████████▋ | 974/1795 [00:08<00:07, 113.94ba/s]\u001b[A\n",
- " 55%|████████████████████████████████████████████████████████████████████████▌ | 986/1795 [00:08<00:07, 111.71ba/s]\u001b[A\n",
- " 56%|█████████████████████████████████████████████████████████████████████████▍ | 998/1795 [00:09<00:07, 107.78ba/s]\u001b[A\n",
- " 56%|█████████████████████████████████████████████████████████████████████████▋ | 1009/1795 [00:09<00:07, 105.28ba/s]\u001b[A\n"
- ]
- },
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- " 57%|██████████████████████████████████████████████████████████████████████████▌ | 1021/1795 [00:09<00:07, 107.16ba/s]\u001b[A\n",
- " 57%|███████████████████████████████████████████████████████████████████████████▎ | 1032/1795 [00:09<00:07, 107.83ba/s]\u001b[A\n",
- " 58%|████████████████████████████████████████████████████████████████████████████▏ | 1044/1795 [00:09<00:06, 109.92ba/s]\u001b[A\n",
- " 59%|█████████████████████████████████████████████████████████████████████████████ | 1056/1795 [00:09<00:06, 112.47ba/s]\u001b[A\n",
- " 59%|█████████████████████████████████████████████████████████████████████████████▉ | 1068/1795 [00:09<00:06, 113.56ba/s]\u001b[A\n",
- " 60%|██████████████████████████████████████████████████████████████████████████████▊ | 1080/1795 [00:09<00:06, 111.84ba/s]\u001b[A\n",
- " 61%|███████████████████████████████████████████████████████████████████████████████▋ | 1092/1795 [00:09<00:06, 111.27ba/s]\u001b[A\n",
- " 62%|████████████████████████████████████████████████████████████████████████████████▌ | 1104/1795 [00:10<00:06, 110.39ba/s]\u001b[A\n",
- " 62%|█████████████████████████████████████████████████████████████████████████████████▍ | 1116/1795 [00:10<00:06, 111.33ba/s]\u001b[A\n",
- " 63%|██████████████████████████████████████████████████████████████████████████████████▎ | 1128/1795 [00:10<00:05, 111.32ba/s]\u001b[A\n",
- " 64%|███████████████████████████████████████████████████████████████████████████████████▏ | 1140/1795 [00:10<00:05, 112.20ba/s]\u001b[A\n",
- " 64%|████████████████████████████████████████████████████████████████████████████████████▏ | 1153/1795 [00:10<00:05, 115.15ba/s]\u001b[A\n",
- " 65%|█████████████████████████████████████████████████████████████████████████████████████ | 1165/1795 [00:10<00:05, 114.07ba/s]\u001b[A\n",
- " 66%|█████████████████████████████████████████████████████████████████████████████████████▉ | 1177/1795 [00:10<00:05, 110.61ba/s]\u001b[A\n",
- " 66%|██████████████████████████████████████████████████████████████████████████████████████▊ | 1189/1795 [00:10<00:05, 110.61ba/s]\u001b[A\n",
- " 67%|███████████████████████████████████████████████████████████████████████████████████████▋ | 1201/1795 [00:10<00:05, 112.56ba/s]\u001b[A\n",
- " 68%|████████████████████████████████████████████████████████████████████████████████████████▌ | 1213/1795 [00:10<00:05, 112.74ba/s]\u001b[A\n",
- " 68%|█████████████████████████████████████████████████████████████████████████████████████████▍ | 1225/1795 [00:11<00:05, 111.53ba/s]\u001b[A\n",
- " 69%|██████████████████████████████████████████████████████████████████████████████████████████▎ | 1237/1795 [00:11<00:05, 110.36ba/s]\u001b[A\n",
- " 70%|███████████████████████████████████████████████████████████████████████████████████████████▏ | 1249/1795 [00:11<00:04, 109.75ba/s]\u001b[A\n",
- " 70%|███████████████████████████████████████████████████████████████████████████████████████████▉ | 1260/1795 [00:11<00:04, 107.40ba/s]\u001b[A\n",
- " 71%|████████████████████████████████████████████████████████████████████████████████████████████▊ | 1271/1795 [00:11<00:04, 106.67ba/s]\u001b[A\n",
- " 71%|█████████████████████████████████████████████████████████████████████████████████████████████▌ | 1282/1795 [00:11<00:04, 106.95ba/s]\u001b[A\n",
- " 72%|██████████████████████████████████████████████████████████████████████████████████████████████▎ | 1293/1795 [00:11<00:04, 107.69ba/s]\u001b[A\n",
- " 73%|███████████████████████████████████████████████████████████████████████████████████████████████▏ | 1304/1795 [00:11<00:04, 107.86ba/s]\u001b[A\n",
- " 73%|███████████████████████████████████████████████████████████████████████████████████████████████▉ | 1315/1795 [00:11<00:04, 107.71ba/s]\u001b[A\n",
- " 74%|████████████████████████████████████████████████████████████████████████████████████████████████▊ | 1326/1795 [00:12<00:04, 107.71ba/s]\u001b[A\n",
- " 74%|█████████████████████████████████████████████████████████████████████████████████████████████████▌ | 1337/1795 [00:12<00:04, 108.29ba/s]\u001b[A\n",
- " 75%|██████████████████████████████████████████████████████████████████████████████████████████████████▍ | 1349/1795 [00:12<00:04, 109.37ba/s]\u001b[A\n",
- " 76%|███████████████████████████████████████████████████████████████████████████████████████████████████▎ | 1361/1795 [00:12<00:03, 110.19ba/s]\u001b[A\n",
- " 76%|████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 1373/1795 [00:12<00:03, 110.42ba/s]\u001b[A\n",
- " 77%|█████████████████████████████████████████████████████████████████████████████████████████████████████ | 1385/1795 [00:12<00:03, 111.32ba/s]\u001b[A\n",
- " 78%|█████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 1397/1795 [00:12<00:03, 112.54ba/s]\u001b[A\n",
- " 78%|██████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 1409/1795 [00:12<00:03, 112.91ba/s]\u001b[A\n",
- " 79%|███████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 1421/1795 [00:12<00:03, 111.93ba/s]\u001b[A\n",
- " 80%|████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 1433/1795 [00:12<00:03, 109.91ba/s]\u001b[A\n",
- " 81%|█████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 1445/1795 [00:13<00:03, 109.29ba/s]\u001b[A\n",
- " 81%|██████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 1456/1795 [00:13<00:03, 107.81ba/s]\u001b[A\n",
- " 82%|███████████████████████████████████████████████████████████████████████████████████████████████████████████ | 1467/1795 [00:13<00:03, 107.59ba/s]\u001b[A\n",
- " 82%|███████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 1479/1795 [00:13<00:02, 107.83ba/s]\u001b[A\n",
- " 83%|████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 1491/1795 [00:13<00:02, 108.92ba/s]\u001b[A\n",
- " 84%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 1502/1795 [00:13<00:02, 108.64ba/s]\u001b[A\n",
- " 84%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 1514/1795 [00:13<00:02, 110.24ba/s]\u001b[A\n",
- " 85%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 1526/1795 [00:13<00:02, 111.64ba/s]\u001b[A\n",
- " 86%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 1538/1795 [00:13<00:02, 110.08ba/s]\u001b[A\n",
- " 86%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 1550/1795 [00:14<00:02, 108.01ba/s]\u001b[A\n",
- " 87%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 1562/1795 [00:14<00:02, 109.96ba/s]\u001b[A\n",
- " 88%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 1574/1795 [00:14<00:02, 109.67ba/s]\u001b[A\n",
- " 88%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 1585/1795 [00:14<00:01, 107.92ba/s]\u001b[A\n",
- " 89%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 1596/1795 [00:14<00:01, 108.38ba/s]\u001b[A\n",
- " 90%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 1609/1795 [00:14<00:01, 112.44ba/s]\u001b[A\n",
- " 90%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 1621/1795 [00:14<00:01, 110.29ba/s]\u001b[A\n",
- " 91%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 1633/1795 [00:14<00:01, 110.18ba/s]\u001b[A\n",
- " 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 1645/1795 [00:14<00:01, 108.21ba/s]\u001b[A\n",
- " 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 1656/1795 [00:15<00:01, 107.62ba/s]\u001b[A\n",
- " 93%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 1667/1795 [00:15<00:01, 106.66ba/s]\u001b[A\n",
- " 93%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 1678/1795 [00:15<00:01, 104.97ba/s]\u001b[A\n",
- " 94%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 1689/1795 [00:15<00:01, 105.67ba/s]\u001b[A\n",
- " 95%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 1700/1795 [00:15<00:00, 106.08ba/s]\u001b[A\n",
- " 95%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 1712/1795 [00:15<00:00, 107.07ba/s]\u001b[A\n",
- " 96%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 1724/1795 [00:15<00:00, 108.53ba/s]\u001b[A\n",
- " 97%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 1735/1795 [00:15<00:00, 108.05ba/s]\u001b[A\n",
- " 97%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 1747/1795 [00:15<00:00, 110.64ba/s]\u001b[A\n",
- " 98%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 1759/1795 [00:15<00:00, 111.38ba/s]\u001b[A\n",
- " 99%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▏ | 1771/1795 [00:16<00:00, 110.67ba/s]\u001b[A\n",
- " 99%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 1783/1795 [00:16<00:00, 110.52ba/s]\u001b[A\n",
- "100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 1795/1795 [00:16<00:00, 109.98ba/s]\u001b[A\n",
- "\n",
- " 0%| | 0/84 [00:00, ?ba/s]\u001b[A\n",
- " 14%|███████████████████▎ | 12/84 [00:00<00:00, 110.99ba/s]\u001b[A\n",
- " 29%|██████████████████████████████████████▌ | 24/84 [00:00<00:00, 110.80ba/s]\u001b[A\n",
- " 43%|█████████████████████████████████████████████████████████▊ | 36/84 [00:00<00:00, 107.75ba/s]\u001b[A\n",
- " 56%|███████████████████████████████████████████████████████████████████████████▌ | 47/84 [00:00<00:00, 103.83ba/s]\u001b[A\n",
- " 69%|█████████████████████████████████████████████████████████████████████████████████████████████▏ | 58/84 [00:00<00:00, 102.87ba/s]\u001b[A\n",
- " 82%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 69/84 [00:00<00:00, 104.54ba/s]\u001b[A\n",
- "100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 84/84 [00:00<00:00, 106.09ba/s]\u001b[A\n",
- "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [1]\n",
- "\n",
- " | Name | Type | Params\n",
- "-----------------------------------------------------\n",
- "0 | model | T5ForConditionalGeneration | 60.5 M\n",
- "-----------------------------------------------------\n",
- "60.5 M Trainable params\n",
- "0 Non-trainable params\n",
- "60.5 M Total params\n",
- "242.026 Total estimated model params size (MB)\n"
- ]
- },
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "Sanity Checking DataLoader 0: 0%| | 0/2 [00:00, ?it/s]"
- ]
- },
- {
- "ename": "AttributeError",
- "evalue": "'list' object has no attribute 'size'",
- "output_type": "error",
- "traceback": [
- "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
- "\u001b[0;31mAttributeError\u001b[0m Traceback (most recent call last)",
- "Cell \u001b[0;32mIn[8], line 5\u001b[0m\n\u001b[1;32m 3\u001b[0m trainer \u001b[38;5;241m=\u001b[39m pl\u001b[38;5;241m.\u001b[39mTrainer(accelerator\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mgpu\u001b[39m\u001b[38;5;124m\"\u001b[39m, devices\u001b[38;5;241m=\u001b[39m[\u001b[38;5;241m0\u001b[39m], max_epochs\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m10\u001b[39m)\n\u001b[1;32m 4\u001b[0m dm \u001b[38;5;241m=\u001b[39m MyDataModule(batch_size\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m16\u001b[39m)\n\u001b[0;32m----> 5\u001b[0m \u001b[43mtrainer\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mfit\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mdatamodule\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdm\u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:608\u001b[0m, in \u001b[0;36mTrainer.fit\u001b[0;34m(self, model, train_dataloaders, val_dataloaders, datamodule, ckpt_path)\u001b[0m\n\u001b[1;32m 606\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mTypeError\u001b[39;00m(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m`Trainer.fit()` requires a `LightningModule`, got: \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mmodel\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__class__\u001b[39m\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__qualname__\u001b[39m\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 607\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mstrategy\u001b[38;5;241m.\u001b[39m_lightning_module \u001b[38;5;241m=\u001b[39m model\n\u001b[0;32m--> 608\u001b[0m \u001b[43mcall\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_call_and_handle_interrupt\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 609\u001b[0m \u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_fit_impl\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtrain_dataloaders\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mval_dataloaders\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mdatamodule\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mckpt_path\u001b[49m\n\u001b[1;32m 610\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/call.py:38\u001b[0m, in \u001b[0;36m_call_and_handle_interrupt\u001b[0;34m(trainer, trainer_fn, *args, **kwargs)\u001b[0m\n\u001b[1;32m 36\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m trainer\u001b[38;5;241m.\u001b[39mstrategy\u001b[38;5;241m.\u001b[39mlauncher\u001b[38;5;241m.\u001b[39mlaunch(trainer_fn, \u001b[38;5;241m*\u001b[39margs, trainer\u001b[38;5;241m=\u001b[39mtrainer, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs)\n\u001b[1;32m 37\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m---> 38\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mtrainer_fn\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 40\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m _TunerExitException:\n\u001b[1;32m 41\u001b[0m trainer\u001b[38;5;241m.\u001b[39m_call_teardown_hook()\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:650\u001b[0m, in \u001b[0;36mTrainer._fit_impl\u001b[0;34m(self, model, train_dataloaders, val_dataloaders, datamodule, ckpt_path)\u001b[0m\n\u001b[1;32m 643\u001b[0m ckpt_path \u001b[38;5;241m=\u001b[39m ckpt_path \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mresume_from_checkpoint\n\u001b[1;32m 644\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_ckpt_path \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_checkpoint_connector\u001b[38;5;241m.\u001b[39m_set_ckpt_path(\n\u001b[1;32m 645\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mstate\u001b[38;5;241m.\u001b[39mfn,\n\u001b[1;32m 646\u001b[0m ckpt_path, \u001b[38;5;66;03m# type: ignore[arg-type]\u001b[39;00m\n\u001b[1;32m 647\u001b[0m model_provided\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m,\n\u001b[1;32m 648\u001b[0m model_connected\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlightning_module \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m,\n\u001b[1;32m 649\u001b[0m )\n\u001b[0;32m--> 650\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_run\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mckpt_path\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mckpt_path\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 652\u001b[0m \u001b[38;5;28;01massert\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mstate\u001b[38;5;241m.\u001b[39mstopped\n\u001b[1;32m 653\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mtraining \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:1103\u001b[0m, in \u001b[0;36mTrainer._run\u001b[0;34m(self, model, ckpt_path)\u001b[0m\n\u001b[1;32m 1099\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_checkpoint_connector\u001b[38;5;241m.\u001b[39mrestore_training_state()\n\u001b[1;32m 1101\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_checkpoint_connector\u001b[38;5;241m.\u001b[39mresume_end()\n\u001b[0;32m-> 1103\u001b[0m results \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_run_stage\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1105\u001b[0m log\u001b[38;5;241m.\u001b[39mdetail(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;132;01m{\u001b[39;00m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__class__\u001b[39m\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__name__\u001b[39m\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m: trainer tearing down\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 1106\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_teardown()\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:1182\u001b[0m, in \u001b[0;36mTrainer._run_stage\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 1180\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mpredicting:\n\u001b[1;32m 1181\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_run_predict()\n\u001b[0;32m-> 1182\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_run_train\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:1195\u001b[0m, in \u001b[0;36mTrainer._run_train\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 1192\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_pre_training_routine()\n\u001b[1;32m 1194\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m isolate_rng():\n\u001b[0;32m-> 1195\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_run_sanity_check\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1197\u001b[0m \u001b[38;5;66;03m# enable train mode\u001b[39;00m\n\u001b[1;32m 1198\u001b[0m \u001b[38;5;28;01massert\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:1267\u001b[0m, in \u001b[0;36mTrainer._run_sanity_check\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 1265\u001b[0m \u001b[38;5;66;03m# run eval step\u001b[39;00m\n\u001b[1;32m 1266\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m torch\u001b[38;5;241m.\u001b[39mno_grad():\n\u001b[0;32m-> 1267\u001b[0m \u001b[43mval_loop\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrun\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1269\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_call_callback_hooks(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mon_sanity_check_end\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 1271\u001b[0m \u001b[38;5;66;03m# reset logger connector\u001b[39;00m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/loops/loop.py:199\u001b[0m, in \u001b[0;36mLoop.run\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 197\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[1;32m 198\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mon_advance_start(\u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs)\n\u001b[0;32m--> 199\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43madvance\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 200\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mon_advance_end()\n\u001b[1;32m 201\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_restarting \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/loops/dataloader/evaluation_loop.py:152\u001b[0m, in \u001b[0;36mEvaluationLoop.advance\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 150\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mnum_dataloaders \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m1\u001b[39m:\n\u001b[1;32m 151\u001b[0m kwargs[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mdataloader_idx\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m=\u001b[39m dataloader_idx\n\u001b[0;32m--> 152\u001b[0m dl_outputs \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mepoch_loop\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrun\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_data_fetcher\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mdl_max_batches\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 154\u001b[0m \u001b[38;5;66;03m# store batch level output per dataloader\u001b[39;00m\n\u001b[1;32m 155\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_outputs\u001b[38;5;241m.\u001b[39mappend(dl_outputs)\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/loops/loop.py:199\u001b[0m, in \u001b[0;36mLoop.run\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 197\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[1;32m 198\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mon_advance_start(\u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs)\n\u001b[0;32m--> 199\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43madvance\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 200\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mon_advance_end()\n\u001b[1;32m 201\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_restarting \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/loops/epoch/evaluation_epoch_loop.py:137\u001b[0m, in \u001b[0;36mEvaluationEpochLoop.advance\u001b[0;34m(self, data_fetcher, dl_max_batches, kwargs)\u001b[0m\n\u001b[1;32m 134\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mbatch_progress\u001b[38;5;241m.\u001b[39mincrement_started()\n\u001b[1;32m 136\u001b[0m \u001b[38;5;66;03m# lightning module methods\u001b[39;00m\n\u001b[0;32m--> 137\u001b[0m output \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_evaluation_step\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 138\u001b[0m output \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_evaluation_step_end(output)\n\u001b[1;32m 140\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mbatch_progress\u001b[38;5;241m.\u001b[39mincrement_processed()\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/loops/epoch/evaluation_epoch_loop.py:234\u001b[0m, in \u001b[0;36mEvaluationEpochLoop._evaluation_step\u001b[0;34m(self, **kwargs)\u001b[0m\n\u001b[1;32m 223\u001b[0m \u001b[38;5;250m\u001b[39m\u001b[38;5;124;03m\"\"\"The evaluation step (validation_step or test_step depending on the trainer's state).\u001b[39;00m\n\u001b[1;32m 224\u001b[0m \n\u001b[1;32m 225\u001b[0m \u001b[38;5;124;03mArgs:\u001b[39;00m\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 231\u001b[0m \u001b[38;5;124;03m the outputs of the step\u001b[39;00m\n\u001b[1;32m 232\u001b[0m \u001b[38;5;124;03m\"\"\"\u001b[39;00m\n\u001b[1;32m 233\u001b[0m hook_name \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mtest_step\u001b[39m\u001b[38;5;124m\"\u001b[39m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mtrainer\u001b[38;5;241m.\u001b[39mtesting \u001b[38;5;28;01melse\u001b[39;00m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mvalidation_step\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[0;32m--> 234\u001b[0m output \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mtrainer\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_call_strategy_hook\u001b[49m\u001b[43m(\u001b[49m\u001b[43mhook_name\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mvalues\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 236\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m output\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:1485\u001b[0m, in \u001b[0;36mTrainer._call_strategy_hook\u001b[0;34m(self, hook_name, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1482\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m\n\u001b[1;32m 1484\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mprofiler\u001b[38;5;241m.\u001b[39mprofile(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m[Strategy]\u001b[39m\u001b[38;5;132;01m{\u001b[39;00m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mstrategy\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__class__\u001b[39m\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__name__\u001b[39m\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m.\u001b[39m\u001b[38;5;132;01m{\u001b[39;00mhook_name\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m):\n\u001b[0;32m-> 1485\u001b[0m output \u001b[38;5;241m=\u001b[39m \u001b[43mfn\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1487\u001b[0m \u001b[38;5;66;03m# restore current_fx when nested context\u001b[39;00m\n\u001b[1;32m 1488\u001b[0m pl_module\u001b[38;5;241m.\u001b[39m_current_fx_name \u001b[38;5;241m=\u001b[39m prev_fx_name\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/strategies/strategy.py:390\u001b[0m, in \u001b[0;36mStrategy.validation_step\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 388\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mprecision_plugin\u001b[38;5;241m.\u001b[39mval_step_context():\n\u001b[1;32m 389\u001b[0m \u001b[38;5;28;01massert\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel, ValidationStep)\n\u001b[0;32m--> 390\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mvalidation_step\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n",
- "Cell \u001b[0;32mIn[7], line 36\u001b[0m, in \u001b[0;36mMyLightningModule.validation_step\u001b[0;34m(self, batch, batch_idx)\u001b[0m\n\u001b[1;32m 34\u001b[0m attention_mask \u001b[38;5;241m=\u001b[39m batch[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mattention_mask\u001b[39m\u001b[38;5;124m\"\u001b[39m]\n\u001b[1;32m 35\u001b[0m labels \u001b[38;5;241m=\u001b[39m batch[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mlabels\u001b[39m\u001b[38;5;124m\"\u001b[39m]\n\u001b[0;32m---> 36\u001b[0m loss, logits \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[43m(\u001b[49m\u001b[43minput_ids\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mattention_mask\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mlabels\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 37\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlog(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mval_loss\u001b[39m\u001b[38;5;124m'\u001b[39m, loss, on_epoch\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m, on_step\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mFalse\u001b[39;00m)\n\u001b[1;32m 38\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m {\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mloss\u001b[39m\u001b[38;5;124m'\u001b[39m: loss, \u001b[38;5;124m'\u001b[39m\u001b[38;5;124mlogits\u001b[39m\u001b[38;5;124m'\u001b[39m: logits, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mlabels\u001b[39m\u001b[38;5;124m\"\u001b[39m:labels}\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/torch/nn/modules/module.py:1194\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *input, **kwargs)\u001b[0m\n\u001b[1;32m 1190\u001b[0m \u001b[38;5;66;03m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m 1191\u001b[0m \u001b[38;5;66;03m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m 1192\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m (\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m 1193\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m _global_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> 1194\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mforward_call\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;28;43minput\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1195\u001b[0m \u001b[38;5;66;03m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m 1196\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[38;5;241m=\u001b[39m [], []\n",
- "Cell \u001b[0;32mIn[7], line 16\u001b[0m, in \u001b[0;36mMyLightningModule.forward\u001b[0;34m(self, input_ids, attention_mask, labels)\u001b[0m\n\u001b[1;32m 15\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mforward\u001b[39m(\u001b[38;5;28mself\u001b[39m, input_ids, attention_mask, labels\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m):\n\u001b[0;32m---> 16\u001b[0m output \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 17\u001b[0m \u001b[43m \u001b[49m\u001b[43minput_ids\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43minput_ids\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 18\u001b[0m \u001b[43m \u001b[49m\u001b[43mattention_mask\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mattention_mask\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 19\u001b[0m \u001b[43m \u001b[49m\u001b[43mlabels\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mlabels\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 20\u001b[0m \u001b[43m \u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 21\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m output\u001b[38;5;241m.\u001b[39mloss, output\u001b[38;5;241m.\u001b[39mlogits\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/torch/nn/modules/module.py:1194\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *input, **kwargs)\u001b[0m\n\u001b[1;32m 1190\u001b[0m \u001b[38;5;66;03m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m 1191\u001b[0m \u001b[38;5;66;03m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m 1192\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m (\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m 1193\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m _global_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> 1194\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mforward_call\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;28;43minput\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1195\u001b[0m \u001b[38;5;66;03m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m 1196\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[38;5;241m=\u001b[39m [], []\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/transformers/models/t5/modeling_t5.py:1624\u001b[0m, in \u001b[0;36mT5ForConditionalGeneration.forward\u001b[0;34m(self, input_ids, attention_mask, decoder_input_ids, decoder_attention_mask, head_mask, decoder_head_mask, cross_attn_head_mask, encoder_outputs, past_key_values, inputs_embeds, decoder_inputs_embeds, labels, use_cache, output_attentions, output_hidden_states, return_dict)\u001b[0m\n\u001b[1;32m 1621\u001b[0m \u001b[38;5;66;03m# Encode if needed (training, first prediction pass)\u001b[39;00m\n\u001b[1;32m 1622\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m encoder_outputs \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[1;32m 1623\u001b[0m \u001b[38;5;66;03m# Convert encoder inputs in embeddings if needed\u001b[39;00m\n\u001b[0;32m-> 1624\u001b[0m encoder_outputs \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mencoder\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 1625\u001b[0m \u001b[43m \u001b[49m\u001b[43minput_ids\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43minput_ids\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1626\u001b[0m \u001b[43m \u001b[49m\u001b[43mattention_mask\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mattention_mask\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1627\u001b[0m \u001b[43m \u001b[49m\u001b[43minputs_embeds\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43minputs_embeds\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1628\u001b[0m \u001b[43m \u001b[49m\u001b[43mhead_mask\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mhead_mask\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1629\u001b[0m \u001b[43m \u001b[49m\u001b[43moutput_attentions\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43moutput_attentions\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1630\u001b[0m \u001b[43m \u001b[49m\u001b[43moutput_hidden_states\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43moutput_hidden_states\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1631\u001b[0m \u001b[43m \u001b[49m\u001b[43mreturn_dict\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mreturn_dict\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1632\u001b[0m \u001b[43m \u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1633\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m return_dict \u001b[38;5;129;01mand\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(encoder_outputs, BaseModelOutput):\n\u001b[1;32m 1634\u001b[0m encoder_outputs \u001b[38;5;241m=\u001b[39m BaseModelOutput(\n\u001b[1;32m 1635\u001b[0m last_hidden_state\u001b[38;5;241m=\u001b[39mencoder_outputs[\u001b[38;5;241m0\u001b[39m],\n\u001b[1;32m 1636\u001b[0m hidden_states\u001b[38;5;241m=\u001b[39mencoder_outputs[\u001b[38;5;241m1\u001b[39m] \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mlen\u001b[39m(encoder_outputs) \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m1\u001b[39m \u001b[38;5;28;01melse\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m,\n\u001b[1;32m 1637\u001b[0m attentions\u001b[38;5;241m=\u001b[39mencoder_outputs[\u001b[38;5;241m2\u001b[39m] \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mlen\u001b[39m(encoder_outputs) \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m2\u001b[39m \u001b[38;5;28;01melse\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m,\n\u001b[1;32m 1638\u001b[0m )\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/torch/nn/modules/module.py:1194\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *input, **kwargs)\u001b[0m\n\u001b[1;32m 1190\u001b[0m \u001b[38;5;66;03m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m 1191\u001b[0m \u001b[38;5;66;03m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m 1192\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m (\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m 1193\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m _global_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> 1194\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mforward_call\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;28;43minput\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1195\u001b[0m \u001b[38;5;66;03m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m 1196\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[38;5;241m=\u001b[39m [], []\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/transformers/models/t5/modeling_t5.py:944\u001b[0m, in \u001b[0;36mT5Stack.forward\u001b[0;34m(self, input_ids, attention_mask, encoder_hidden_states, encoder_attention_mask, inputs_embeds, head_mask, cross_attn_head_mask, past_key_values, use_cache, output_attentions, output_hidden_states, return_dict)\u001b[0m\n\u001b[1;32m 940\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\n\u001b[1;32m 941\u001b[0m \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mYou cannot specify both \u001b[39m\u001b[38;5;132;01m{\u001b[39;00merr_msg_prefix\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124minput_ids and \u001b[39m\u001b[38;5;132;01m{\u001b[39;00merr_msg_prefix\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124minputs_embeds at the same time\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[1;32m 942\u001b[0m )\n\u001b[1;32m 943\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m input_ids \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[0;32m--> 944\u001b[0m input_shape \u001b[38;5;241m=\u001b[39m \u001b[43minput_ids\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43msize\u001b[49m()\n\u001b[1;32m 945\u001b[0m input_ids \u001b[38;5;241m=\u001b[39m input_ids\u001b[38;5;241m.\u001b[39mview(\u001b[38;5;241m-\u001b[39m\u001b[38;5;241m1\u001b[39m, input_shape[\u001b[38;5;241m-\u001b[39m\u001b[38;5;241m1\u001b[39m])\n\u001b[1;32m 946\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m inputs_embeds \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n",
- "\u001b[0;31mAttributeError\u001b[0m: 'list' object has no attribute 'size'"
- ]
- }
- ],
- "source": [
- "torch.set_float32_matmul_precision(\"medium\")\n",
- "model = MyLightningModule(model_name=\"t5-small\", learning_rate=1e-5, weight_decay=1e-4, batch_size=16)\n",
- "trainer = pl.Trainer(accelerator=\"gpu\", devices=[0], max_epochs=10)\n",
- "dm = MyDataModule(batch_size=16)\n",
- "trainer.fit(model, datamodule=dm)"
- ]
- },
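- {
- "cell_type": "code",
- "execution_count": null,
- "id": "0d3b1f2a",
- "metadata": {},
- "outputs": [],
- "source": [
- "# Hedged debugging sketch (not part of the original run): the AttributeError above\n",
- "# ('list' object has no attribute 'size') suggests the dataloader is yielding Python\n",
- "# lists instead of tensors. Inspecting one batch from the assumed MyDataModule makes\n",
- "# that easy to confirm before calling trainer.fit again.\n",
- "dm.setup(\"fit\")\n",
- "batch = next(iter(dm.train_dataloader()))\n",
- "for key, value in batch.items():\n",
- "    print(key, type(value))\n",
- "\n",
- "# If a field comes back as a list of tensors, one option is a collate_fn that stacks it:\n",
- "# def collate_fn(features):\n",
- "#     return {k: torch.stack([f[k] for f in features]) for k in features[0]}"
- ]
- },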
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "1395d5d2",
- "metadata": {},
- "outputs": [],
- "source": []
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "80a2efab",
- "metadata": {},
- "outputs": [],
- "source": []
- }
- ],
- "metadata": {
- "kernelspec": {
- "display_name": "Python 3 (ipykernel)",
- "language": "python",
- "name": "python3"
- },
- "language_info": {
- "codemirror_mode": {
- "name": "ipython",
- "version": 3
- },
- "file_extension": ".py",
- "mimetype": "text/x-python",
- "name": "python",
- "nbconvert_exporter": "python",
- "pygments_lexer": "ipython3",
- "version": "3.10.9"
- }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/ML/Pytorch/huggingface/.ipynb_checkpoints/finetuning_t5_small_cnndaily-checkpoint.ipynb b/ML/Pytorch/huggingface/.ipynb_checkpoints/finetuning_t5_small_cnndaily-checkpoint.ipynb
deleted file mode 100644
index 8cfe998..0000000
--- a/ML/Pytorch/huggingface/.ipynb_checkpoints/finetuning_t5_small_cnndaily-checkpoint.ipynb
+++ /dev/null
@@ -1,3585 +0,0 @@
-{
- "cells": [
- {
- "cell_type": "code",
- "execution_count": 7,
- "id": "bd8e3b95",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- ""
- ],
- "text/plain": [
- ""
- ]
- },
- "execution_count": 7,
- "metadata": {},
- "output_type": "execute_result"
- }
- ],
- "source": [
- "from jupyterthemes.stylefx import set_nb_theme\n",
- "set_nb_theme('chesterish')"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 2,
- "id": "8c2a24cb",
- "metadata": {},
- "outputs": [],
- "source": [
- "import os\n",
- "os.environ[\"CUDA_DEVICE_ORDER\"]=\"PCI_BUS_ID\"\n",
- "os.environ[\"CUDA_VISIBLE_DEVICES\"]=\"0\""
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 3,
- "id": "f45eb6b0",
- "metadata": {},
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "/home/mrbean/.conda/envs/whisper_lightning/lib/python3.10/site-packages/tqdm/auto.py:22: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
- " from .autonotebook import tqdm as notebook_tqdm\n",
- "2023-02-21 15:40:52.888700: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA\n",
- "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
- "2023-02-21 15:40:53.473104: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory\n",
- "2023-02-21 15:40:53.473149: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory\n",
- "2023-02-21 15:40:53.473154: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly.\n"
- ]
- }
- ],
- "source": [
- "import numpy as np\n",
- "import torch\n",
- "\n",
- "import datasets \n",
- "\n",
- "from datasets import load_dataset, load_metric\n",
- "\n",
- "from transformers import (\n",
- " AutoModel,\n",
- " AutoModelForMaskedLM,\n",
- " AutoModelForSeq2SeqLM,\n",
- " AutoModelForTokenClassification,\n",
- " AutoTokenizer,\n",
- " DataCollatorForSeq2Seq,\n",
- " pipeline,\n",
- " Seq2SeqTrainingArguments,\n",
- " Seq2SeqTrainer,\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 4,
- "id": "7fc4eb40",
- "metadata": {},
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "/home/mrbean/.conda/envs/whisper_lightning/lib/python3.10/site-packages/transformers/models/t5/tokenization_t5_fast.py:155: FutureWarning: This tokenizer was incorrectly instantiated with a model max length of 512 which will be corrected in Transformers v5.\n",
- "For now, this behavior is kept to avoid breaking backwards compatibility when padding/encoding with `truncation is True`.\n",
- "- Be aware that you SHOULD NOT rely on t5-small automatically truncating your input to 512 when padding/encoding.\n",
- "- If you want to encode/pad to sequences longer than 512 you can either instantiate this tokenizer with `model_max_length` or pass `max_length` when encoding/padding.\n",
- "- To avoid this warning, please instantiate this tokenizer with `model_max_length` set to your preferred value.\n",
- " warnings.warn(\n"
- ]
- }
- ],
- "source": [
- "# Load the pre-trained model and tokenizer\n",
- "model_name = \"t5-small\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name)\n",
- "model = AutoModelForSeq2SeqLM.from_pretrained(model_name)"
- ]
- },
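- {
- "cell_type": "code",
- "execution_count": null,
- "id": "b7e21c9d",
- "metadata": {},
- "outputs": [],
- "source": [
- "# Optional sketch: the FutureWarning above can be silenced by setting model_max_length\n",
- "# explicitly when loading the tokenizer. The value 512 is an assumption that simply\n",
- "# matches the max_length used during preprocessing below.\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name, model_max_length=512)"
- ]
- },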
- {
- "cell_type": "code",
- "execution_count": 5,
- "id": "363045f5",
- "metadata": {},
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "Found cached dataset cnn_dailymail (/home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de)\n",
- "Found cached dataset cnn_dailymail (/home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de)\n",
- "100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 1122/1122 [02:06<00:00, 8.88ba/s]\n",
- "Loading cached processed dataset at /home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de/cache-2d3b7edd75fb1188.arrow\n"
- ]
- }
- ],
- "source": [
- "def preprocess_function(batch):\n",
- " inputs = tokenizer(batch[\"article\"], padding=\"max_length\", truncation=True, max_length=512)\n",
- " outputs = tokenizer(batch[\"highlights\"], padding=\"max_length\", truncation=True, max_length=128)\n",
- " batch[\"input_ids\"] = inputs.input_ids\n",
- " batch[\"attention_mask\"] = inputs.attention_mask\n",
- " batch[\"labels\"] = outputs.input_ids.copy()\n",
- " return batch\n",
- "\n",
- "# Load the dataset\n",
- "train_data = load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"train\")\n",
- "val_data = load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"validation[:10%]\")\n",
- "\n",
- "train_ds = train_data.map(\n",
- " preprocess_function, \n",
- " batched=True, \n",
- " batch_size=256, \n",
- " remove_columns=[\"article\", \"highlights\", \"id\"]\n",
- ")\n",
- "\n",
- "val_ds = val_data.map(\n",
- " preprocess_function, \n",
- " batched=True, \n",
- " batch_size=256, \n",
- " remove_columns=[\"article\", \"highlights\", \"id\"]\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 6,
- "id": "6faa8c86",
- "metadata": {},
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "/tmp/ipykernel_478601/1088570042.py:23: FutureWarning: load_metric is deprecated and will be removed in the next major version of datasets. Use 'evaluate.load' instead, from the new library 🤗 Evaluate: https://huggingface.co/docs/evaluate\n",
- " metric = load_metric(\"rouge\")\n",
- "max_steps is given, it will override any value given in num_train_epochs\n",
- "Using cuda_amp half precision backend\n",
- "The following columns in the training set don't have a corresponding argument in `T5ForConditionalGeneration.forward` and have been ignored: id, article, highlights. If id, article, highlights are not expected by `T5ForConditionalGeneration.forward`, you can safely ignore this message.\n",
- "/home/mrbean/.conda/envs/whisper_lightning/lib/python3.10/site-packages/transformers/optimization.py:306: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
- " warnings.warn(\n",
- "***** Running training *****\n",
- " Num examples = 0\n",
- " Num Epochs = 1\n",
- " Instantaneous batch size per device = 16\n",
- " Total train batch size (w. parallel, distributed & accumulation) = 16\n",
- " Gradient Accumulation steps = 1\n",
- " Total optimization steps = 5000\n",
- " Number of trainable parameters = 60506624\n"
- ]
- },
- {
- "ename": "IndexError",
- "evalue": "Invalid key: 90427 is out of bounds for size 0",
- "output_type": "error",
- "traceback": [
- "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
- "\u001b[0;31mIndexError\u001b[0m Traceback (most recent call last)",
- "Cell \u001b[0;32mIn[6], line 47\u001b[0m\n\u001b[1;32m 36\u001b[0m trainer \u001b[38;5;241m=\u001b[39m Seq2SeqTrainer(\n\u001b[1;32m 37\u001b[0m model\u001b[38;5;241m=\u001b[39mmodel,\n\u001b[1;32m 38\u001b[0m args\u001b[38;5;241m=\u001b[39mtraining_args,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 43\u001b[0m compute_metrics\u001b[38;5;241m=\u001b[39mcompute_metrics,\n\u001b[1;32m 44\u001b[0m )\n\u001b[1;32m 46\u001b[0m \u001b[38;5;66;03m# Start the training\u001b[39;00m\n\u001b[0;32m---> 47\u001b[0m \u001b[43mtrainer\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mtrain\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/transformers/trainer.py:1539\u001b[0m, in \u001b[0;36mTrainer.train\u001b[0;34m(self, resume_from_checkpoint, trial, ignore_keys_for_eval, **kwargs)\u001b[0m\n\u001b[1;32m 1534\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel_wrapped \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel\n\u001b[1;32m 1536\u001b[0m inner_training_loop \u001b[38;5;241m=\u001b[39m find_executable_batch_size(\n\u001b[1;32m 1537\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_inner_training_loop, \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_train_batch_size, args\u001b[38;5;241m.\u001b[39mauto_find_batch_size\n\u001b[1;32m 1538\u001b[0m )\n\u001b[0;32m-> 1539\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43minner_training_loop\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 1540\u001b[0m \u001b[43m \u001b[49m\u001b[43margs\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1541\u001b[0m \u001b[43m \u001b[49m\u001b[43mresume_from_checkpoint\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mresume_from_checkpoint\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1542\u001b[0m \u001b[43m \u001b[49m\u001b[43mtrial\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mtrial\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1543\u001b[0m \u001b[43m \u001b[49m\u001b[43mignore_keys_for_eval\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mignore_keys_for_eval\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1544\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/transformers/trainer.py:1761\u001b[0m, in \u001b[0;36mTrainer._inner_training_loop\u001b[0;34m(self, batch_size, args, resume_from_checkpoint, trial, ignore_keys_for_eval)\u001b[0m\n\u001b[1;32m 1758\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_load_rng_state(resume_from_checkpoint)\n\u001b[1;32m 1760\u001b[0m step \u001b[38;5;241m=\u001b[39m \u001b[38;5;241m-\u001b[39m\u001b[38;5;241m1\u001b[39m\n\u001b[0;32m-> 1761\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m step, inputs \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28menumerate\u001b[39m(epoch_iterator):\n\u001b[1;32m 1762\u001b[0m \n\u001b[1;32m 1763\u001b[0m \u001b[38;5;66;03m# Skip past any already trained steps if resuming training\u001b[39;00m\n\u001b[1;32m 1764\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m steps_trained_in_current_epoch \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m0\u001b[39m:\n\u001b[1;32m 1765\u001b[0m steps_trained_in_current_epoch \u001b[38;5;241m-\u001b[39m\u001b[38;5;241m=\u001b[39m \u001b[38;5;241m1\u001b[39m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/torch/utils/data/dataloader.py:628\u001b[0m, in \u001b[0;36m_BaseDataLoaderIter.__next__\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 625\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_sampler_iter \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[1;32m 626\u001b[0m \u001b[38;5;66;03m# TODO(https://github.com/pytorch/pytorch/issues/76750)\u001b[39;00m\n\u001b[1;32m 627\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_reset() \u001b[38;5;66;03m# type: ignore[call-arg]\u001b[39;00m\n\u001b[0;32m--> 628\u001b[0m data \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_next_data\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 629\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_num_yielded \u001b[38;5;241m+\u001b[39m\u001b[38;5;241m=\u001b[39m \u001b[38;5;241m1\u001b[39m\n\u001b[1;32m 630\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_dataset_kind \u001b[38;5;241m==\u001b[39m _DatasetKind\u001b[38;5;241m.\u001b[39mIterable \u001b[38;5;129;01mand\u001b[39;00m \\\n\u001b[1;32m 631\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_IterableDataset_len_called \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m \u001b[38;5;129;01mand\u001b[39;00m \\\n\u001b[1;32m 632\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_num_yielded \u001b[38;5;241m>\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_IterableDataset_len_called:\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/torch/utils/data/dataloader.py:671\u001b[0m, in \u001b[0;36m_SingleProcessDataLoaderIter._next_data\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 669\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21m_next_data\u001b[39m(\u001b[38;5;28mself\u001b[39m):\n\u001b[1;32m 670\u001b[0m index \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_next_index() \u001b[38;5;66;03m# may raise StopIteration\u001b[39;00m\n\u001b[0;32m--> 671\u001b[0m data \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_dataset_fetcher\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mfetch\u001b[49m\u001b[43m(\u001b[49m\u001b[43mindex\u001b[49m\u001b[43m)\u001b[49m \u001b[38;5;66;03m# may raise StopIteration\u001b[39;00m\n\u001b[1;32m 672\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_pin_memory:\n\u001b[1;32m 673\u001b[0m data \u001b[38;5;241m=\u001b[39m _utils\u001b[38;5;241m.\u001b[39mpin_memory\u001b[38;5;241m.\u001b[39mpin_memory(data, \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_pin_memory_device)\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/torch/utils/data/_utils/fetch.py:58\u001b[0m, in \u001b[0;36m_MapDatasetFetcher.fetch\u001b[0;34m(self, possibly_batched_index)\u001b[0m\n\u001b[1;32m 56\u001b[0m data \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mdataset\u001b[38;5;241m.\u001b[39m__getitems__(possibly_batched_index)\n\u001b[1;32m 57\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m---> 58\u001b[0m data \u001b[38;5;241m=\u001b[39m [\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mdataset[idx] \u001b[38;5;28;01mfor\u001b[39;00m idx \u001b[38;5;129;01min\u001b[39;00m possibly_batched_index]\n\u001b[1;32m 59\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 60\u001b[0m data \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mdataset[possibly_batched_index]\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/torch/utils/data/_utils/fetch.py:58\u001b[0m, in \u001b[0;36m\u001b[0;34m(.0)\u001b[0m\n\u001b[1;32m 56\u001b[0m data \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mdataset\u001b[38;5;241m.\u001b[39m__getitems__(possibly_batched_index)\n\u001b[1;32m 57\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m---> 58\u001b[0m data \u001b[38;5;241m=\u001b[39m [\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mdataset\u001b[49m\u001b[43m[\u001b[49m\u001b[43midx\u001b[49m\u001b[43m]\u001b[49m \u001b[38;5;28;01mfor\u001b[39;00m idx \u001b[38;5;129;01min\u001b[39;00m possibly_batched_index]\n\u001b[1;32m 59\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 60\u001b[0m data \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mdataset[possibly_batched_index]\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/datasets/arrow_dataset.py:2601\u001b[0m, in \u001b[0;36mDataset.__getitem__\u001b[0;34m(self, key)\u001b[0m\n\u001b[1;32m 2599\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21m__getitem__\u001b[39m(\u001b[38;5;28mself\u001b[39m, key): \u001b[38;5;66;03m# noqa: F811\u001b[39;00m\n\u001b[1;32m 2600\u001b[0m \u001b[38;5;250m \u001b[39m\u001b[38;5;124;03m\"\"\"Can be used to index columns (by string names) or rows (by integer index or iterable of indices or bools).\"\"\"\u001b[39;00m\n\u001b[0;32m-> 2601\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_getitem\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 2602\u001b[0m \u001b[43m \u001b[49m\u001b[43mkey\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 2603\u001b[0m \u001b[43m \u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/datasets/arrow_dataset.py:2585\u001b[0m, in \u001b[0;36mDataset._getitem\u001b[0;34m(self, key, **kwargs)\u001b[0m\n\u001b[1;32m 2583\u001b[0m format_kwargs \u001b[38;5;241m=\u001b[39m format_kwargs \u001b[38;5;28;01mif\u001b[39;00m format_kwargs \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m \u001b[38;5;28;01melse\u001b[39;00m {}\n\u001b[1;32m 2584\u001b[0m formatter \u001b[38;5;241m=\u001b[39m get_formatter(format_type, features\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mfeatures, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mformat_kwargs)\n\u001b[0;32m-> 2585\u001b[0m pa_subtable \u001b[38;5;241m=\u001b[39m \u001b[43mquery_table\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_data\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mkey\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mindices\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_indices\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43;01mif\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_indices\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;129;43;01mis\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[38;5;129;43;01mnot\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[38;5;28;43;01mNone\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[38;5;28;43;01melse\u001b[39;49;00m\u001b[43m \u001b[49m\u001b[38;5;28;43;01mNone\u001b[39;49;00m\u001b[43m)\u001b[49m\n\u001b[1;32m 2586\u001b[0m formatted_output \u001b[38;5;241m=\u001b[39m format_table(\n\u001b[1;32m 2587\u001b[0m pa_subtable, key, formatter\u001b[38;5;241m=\u001b[39mformatter, format_columns\u001b[38;5;241m=\u001b[39mformat_columns, output_all_columns\u001b[38;5;241m=\u001b[39moutput_all_columns\n\u001b[1;32m 2588\u001b[0m )\n\u001b[1;32m 2589\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m formatted_output\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/datasets/formatting/formatting.py:588\u001b[0m, in \u001b[0;36mquery_table\u001b[0;34m(table, key, indices)\u001b[0m\n\u001b[1;32m 586\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m 587\u001b[0m size \u001b[38;5;241m=\u001b[39m indices\u001b[38;5;241m.\u001b[39mnum_rows \u001b[38;5;28;01mif\u001b[39;00m indices \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m \u001b[38;5;28;01melse\u001b[39;00m table\u001b[38;5;241m.\u001b[39mnum_rows\n\u001b[0;32m--> 588\u001b[0m \u001b[43m_check_valid_index_key\u001b[49m\u001b[43m(\u001b[49m\u001b[43mkey\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43msize\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 589\u001b[0m \u001b[38;5;66;03m# Query the main table\u001b[39;00m\n\u001b[1;32m 590\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m indices \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/datasets/formatting/formatting.py:531\u001b[0m, in \u001b[0;36m_check_valid_index_key\u001b[0;34m(key, size)\u001b[0m\n\u001b[1;32m 529\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(key, \u001b[38;5;28mint\u001b[39m):\n\u001b[1;32m 530\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m (key \u001b[38;5;241m<\u001b[39m \u001b[38;5;241m0\u001b[39m \u001b[38;5;129;01mand\u001b[39;00m key \u001b[38;5;241m+\u001b[39m size \u001b[38;5;241m<\u001b[39m \u001b[38;5;241m0\u001b[39m) \u001b[38;5;129;01mor\u001b[39;00m (key \u001b[38;5;241m>\u001b[39m\u001b[38;5;241m=\u001b[39m size):\n\u001b[0;32m--> 531\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mIndexError\u001b[39;00m(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mInvalid key: \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mkey\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m is out of bounds for size \u001b[39m\u001b[38;5;132;01m{\u001b[39;00msize\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 532\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m\n\u001b[1;32m 533\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(key, \u001b[38;5;28mslice\u001b[39m):\n",
- "\u001b[0;31mIndexError\u001b[0m: Invalid key: 90427 is out of bounds for size 0"
- ]
- }
- ],
- "source": [
- "class MyLightningModule(pl.LightningModule):\n",
- " def __init__(self, model_name, learning_rate, weight_decay, batch_size, num_training_steps):\n",
- " super().__init__()\n",
- " self.model_name = model_name\n",
- " self.learning_rate = learning_rate\n",
- " self.weight_decay = weight_decay\n",
- " self.batch_size = batch_size\n",
- " self.num_training_steps = num_training_steps\n",
- " \n",
- " # Load the pre-trained model and tokenizer\n",
- " self.tokenizer = AutoTokenizer.from_pretrained(self.model_name)\n",
- " self.model = AutoModelForSeq2SeqLM.from_pretrained(self.model_name)\n",
- "\n",
- " def forward(self, input_ids, attention_mask, labels=None):\n",
- " output = self.model(\n",
- " input_ids=input_ids,\n",
- " attention_mask=attention_mask,\n",
- " labels=labels,\n",
- " )\n",
- " return output.loss, output.logits\n",
- " \n",
- " def training_step(self, batch, batch_idx):\n",
- " input_ids = batch[\"input_ids\"]\n",
- " attention_mask = batch[\"attention_mask\"]\n",
- " labels = batch[\"labels\"]\n",
- " \n",
- " loss\n",
- "\n",
- "# Define the data collator\n",
- "data_collator = DataCollatorForSeq2Seq(tokenizer, model=model)\n",
- "\n",
- "# Initialize the trainer arguments\n",
- "training_args = Seq2SeqTrainingArguments(\n",
- " output_dir=\"./results\",\n",
- " learning_rate=1e-5,\n",
- " per_device_train_batch_size=16,\n",
- " per_device_eval_batch_size=16,\n",
- " max_steps=5000,\n",
- " weight_decay=1e-4,\n",
- " push_to_hub=False,\n",
- " evaluation_strategy = \"steps\",\n",
- " eval_steps = 50,\n",
- " generation_max_length=128,\n",
- " predict_with_generate=True,\n",
- " logging_steps=100,\n",
- " gradient_accumulation_steps=1,\n",
- " fp16=True,\n",
- ")\n",
- "\n",
- "# Load the ROUGE metric\n",
- "metric = load_metric(\"rouge\")\n",
- "\n",
- "# Define the evaluation function\n",
- "def compute_metrics(pred):\n",
- " labels = pred.label_ids\n",
- " preds = pred.predictions\n",
- " decoded_preds = tokenizer.batch_decode(preds, skip_special_tokens=True)\n",
- " decoded_labels = tokenizer.batch_decode(labels, skip_special_tokens=True)\n",
- " scores = metric.compute(predictions=decoded_preds, references=decoded_labels, rouge_types=[\"rouge1\"])[\"rouge1\"].mid\n",
- " return {\"rouge1_precision\": scores.precision, \"rouge1_recall\": scores.recall, \"rouge1_fmeasure\": scores.fmeasure}\n",
- "\n",
- "\n",
- "# Initialize the trainer\n",
- "trainer = Seq2SeqTrainer(\n",
- " model=model,\n",
- " args=training_args,\n",
- " train_dataset=train_data,\n",
- " eval_dataset=val_data,\n",
- " data_collator=data_collator,\n",
- " tokenizer=tokenizer,\n",
- " compute_metrics=compute_metrics,\n",
- ")\n",
- "\n",
- "# Start the training\n",
- "trainer.train()"
- ]
- },
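- {
- "cell_type": "code",
- "execution_count": null,
- "id": "c4f8a7e1",
- "metadata": {},
- "outputs": [],
- "source": [
- "# Sketch of the replacement suggested by the FutureWarning above: datasets.load_metric\n",
- "# is deprecated in favour of the evaluate library. Assumes `evaluate` and `rouge_score`\n",
- "# are installed; this is only an illustration, not part of the training run.\n",
- "import evaluate\n",
- "\n",
- "rouge = evaluate.load(\"rouge\")\n",
- "print(rouge.compute(predictions=[\"the cat sat on the mat\"], references=[\"a cat sat on the mat\"]))"
- ]
- },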
- {
- "cell_type": "markdown",
- "id": "1b0f9a76",
- "metadata": {},
- "source": [
- "# Steps:\n",
- "1. Rewrite code to be more general\n",
- "\n",
- "a) Data loading should be from disk rather than their load_dataset, and should be on the fly\n",
- "\n",
- "b) Rewrite to Lightning code, Trainer etc using Lightning, compute metric fine that we use huggingface"
- ]
- },
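- {
- "cell_type": "code",
- "execution_count": null,
- "id": "d2a9c5b3",
- "metadata": {},
- "outputs": [],
- "source": [
- "# Rough sketch for steps 1a/1b above, not a finished implementation: a LightningDataModule\n",
- "# wrapping disk-backed datasets. The csv paths and the cnn_dailymail Dataset class are\n",
- "# assumptions about how the data gets exported to disk; adjust both to the real layout.\n",
- "from torch.utils.data import DataLoader\n",
- "import pytorch_lightning as pl\n",
- "\n",
- "class MyDataModule(pl.LightningDataModule):\n",
- "    def __init__(self, batch_size=16):\n",
- "        super().__init__()\n",
- "        self.batch_size = batch_size\n",
- "\n",
- "    def setup(self, stage=None):\n",
- "        # assumption: train.csv / validation.csv were written to disk beforehand\n",
- "        self.train_ds = cnn_dailymail(\"train.csv\", tokenizer)\n",
- "        self.val_ds = cnn_dailymail(\"validation.csv\", tokenizer)\n",
- "\n",
- "    def train_dataloader(self):\n",
- "        return DataLoader(self.train_ds, batch_size=self.batch_size, shuffle=True, num_workers=4)\n",
- "\n",
- "    def val_dataloader(self):\n",
- "        return DataLoader(self.val_ds, batch_size=self.batch_size, num_workers=4)"
- ]
- },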
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "ff03c8bb",
- "metadata": {},
- "outputs": [],
- "source": [
- "!nvidia-smi"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "aafc4b27",
- "metadata": {},
- "outputs": [],
- "source": []
- }
- ],
- "metadata": {
- "kernelspec": {
- "display_name": "Python 3 (ipykernel)",
- "language": "python",
- "name": "python3"
- },
- "language_info": {
- "codemirror_mode": {
- "name": "ipython",
- "version": 3
- },
- "file_extension": ".py",
- "mimetype": "text/x-python",
- "name": "python",
- "nbconvert_exporter": "python",
- "pygments_lexer": "ipython3",
- "version": "3.10.9"
- }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/ML/Pytorch/huggingface/.ipynb_checkpoints/learning-checkpoint.ipynb b/ML/Pytorch/huggingface/.ipynb_checkpoints/learning-checkpoint.ipynb
deleted file mode 100644
index c821b42..0000000
--- a/ML/Pytorch/huggingface/.ipynb_checkpoints/learning-checkpoint.ipynb
+++ /dev/null
@@ -1,644 +0,0 @@
-{
- "cells": [
- {
- "cell_type": "code",
- "execution_count": 23,
- "id": "7d5e92c6",
- "metadata": {},
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "[{'entity': 'I-FOOD', 'score': 0.49999642, 'index': 5, 'word': 'Turtle', 'start': 8, 'end': 14}, {'entity': 'I-FOOD', 'score': 0.6096488, 'index': 6, 'word': '##s', 'start': 14, 'end': 15}, {'entity': 'B-FOOD', 'score': 0.45608267, 'index': 7, 'word': 'Original', 'start': 16, 'end': 24}, {'entity': 'I-FOOD', 'score': 0.6613699, 'index': 8, 'word': 'Cara', 'start': 25, 'end': 29}, {'entity': 'I-FOOD', 'score': 0.5776781, 'index': 9, 'word': '##mel', 'start': 29, 'end': 32}, {'entity': 'I-FOOD', 'score': 0.86556953, 'index': 10, 'word': 'Chocolate', 'start': 33, 'end': 42}, {'entity': 'I-FOOD', 'score': 0.96111995, 'index': 11, 'word': 'P', 'start': 43, 'end': 44}, {'entity': 'I-FOOD', 'score': 0.8003402, 'index': 12, 'word': '##eca', 'start': 44, 'end': 47}, {'entity': 'I-FOOD', 'score': 0.9277613, 'index': 13, 'word': '##n', 'start': 47, 'end': 48}, {'entity': 'I-FOOD', 'score': 0.9217512, 'index': 15, 'word': '##luster', 'start': 50, 'end': 56}]\n"
- ]
- }
- ],
- "source": [
- "from transformers import AutoTokenizer, AutoModelForTokenClassification\n",
- "from transformers import pipeline\n",
- "\n",
- "tokenizer = AutoTokenizer.from_pretrained(\"Dizex/FoodBaseBERT\")\n",
- "model = AutoModelForTokenClassification.from_pretrained(\"Dizex/FoodBaseBERT\")\n",
- "\n",
- "pipe = pipeline(\"ner\", model=model, tokenizer=tokenizer)\n",
- "example = \"Demet's Turtles Original Caramel Chocolate Pecan Clusters 9.3 oz Holiday Gift Box\"\n",
- "\n",
- "ner_entity_results = pipe(example)\n",
- "print(ner_entity_results)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 31,
- "id": "bf67ee76",
- "metadata": {},
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "Turtle s Original Cara mel Chocolate P eca n luster\n"
- ]
- }
- ],
- "source": [
- "ner_entity_results = pipe(example)\n",
- "\n",
- "# Initialize the entity words list with an empty string\n",
- "entity_words = [\"\"]\n",
- "\n",
- "# Loop through each dictionary in the list and extract the entity word\n",
- "for result in ner_entity_results:\n",
- " if result[\"entity\"] == \"B-FOOD\":\n",
- " entity_words.append(result[\"word\"])\n",
- " elif result[\"entity\"] == \"I-FOOD\":\n",
- " entity_words[-1] += \" \" + result[\"word\"]\n",
- "\n",
- "# Remove any remaining ## symbols and extra spaces\n",
- "entity_words = [word.replace(\"##\", \"\").strip() for word in entity_words]\n",
- "\n",
- "# Join the entity words into a single string\n",
- "output = \" \".join(entity_words)\n",
- "\n",
- "print(output)\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "fc8e5ea0",
- "metadata": {},
- "outputs": [],
- "source": [
- "import torch\n",
- "print(torch.cuda.is_available())"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "d8a1e039",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import pipeline\n",
- "import numpy as np"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "6ad73024",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "classifier = pipeline(\"zero-shot-classification\")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "04f7e02c",
- "metadata": {},
- "outputs": [],
- "source": [
- "classifier(\n",
- " \"This is a course about the Transformers library\",\n",
- " candidate_labels=[\"machine learning\", \"gym\", \"food\"],\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "6fb246c2",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "from transformers import pipeline\n",
- "generator = pipeline(task=\"text-generation\", model=\"bigscience/bloom-1b7\", device=0)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "c4e174f0",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import AutoModelForTokenClassification, AutoModel, AutoTokenizer\n",
- "import torch\n",
- "\n",
- "# Define input text and pre-trained model checkpoint\n",
- "text = \"My name is wolfgang and I live in berlin\"\n",
- "checkpoint = \"Jean-Baptiste/roberta-large-ner-english\"\n",
- "\n",
- "# Instantiate tokenizer and encode input text\n",
- "tokenizer = AutoTokenizer.from_pretrained(checkpoint)\n",
- "inputs = tokenizer(text, padding=True, truncation=True, return_tensors=\"pt\")\n",
- "\n",
- "# Instantiate model and generate output\n",
- "model = AutoModel.from_pretrained(checkpoint)\n",
- "outputs = model(**inputs)\n",
- "print(outputs[0].shape)\n",
- "\n",
- "# Instantiate token classification model and generate predictions\n",
- "model = AutoModelForTokenClassification.from_pretrained(checkpoint)\n",
- "outputs = model(**inputs)\n",
- "predictions = torch.nn.functional.softmax(outputs.logits, dim=-1)\n",
- "print(predictions)\n",
- "print(model.config.id2label)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "8212bbaa",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import AutoTokenizer, AutoModelForMaskedLM\n",
- "\n",
- "tokenizer = AutoTokenizer.from_pretrained('xlm-roberta-large')\n",
- "model = AutoModelForMaskedLM.from_pretrained(\"xlm-roberta-large\")\n",
- "\n",
- "# prepare input\n",
- "text = \"Replace me by any text you'd like.\"\n",
- "encoded_input = tokenizer(text, return_tensors='pt')\n",
- "\n",
- "# forward pass\n",
- "output = model(**encoded_input)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "314cba41",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import AutoTokenizer, AutoModelForMaskedLM\n",
- "\n",
- "# Load the pre-trained tokenizer and model\n",
- "tokenizer = AutoTokenizer.from_pretrained('xlm-roberta-large')\n",
- "model = AutoModelForMaskedLM.from_pretrained(\"xlm-roberta-large\")\n",
- "\n",
- "# Define the input sentence with a masked token\n",
- "text = \"I want to a new car tomorrow.\"\n",
- "\n",
- "# Tokenize the input sentence, replacing the masked token with a special [MASK] token\n",
- "encoded_input = tokenizer(text, padding=True, truncation=True, return_tensors='pt')\n",
- "\n",
- "print(output.logits.shape)\n",
- "print(encoded_input['input_ids'][0].tolist().index(tokenizer.mask_token_id))\n",
- "\n",
- "# Extract the predicted probabilities for the masked token\n",
- "predicted_probabilities = output.logits[0, encoded_input['input_ids'][0].tolist().index(tokenizer.mask_token_id)]\n",
- "predicted_probabilities = torch.nn.functional.softmax(predicted_probabilities, dim=-1)\n",
- "\n",
- "# Get the top-k most probable predictions for the masked token\n",
- "k = 5\n",
- "top_k = torch.topk(predicted_probabilities, k)\n",
- "for i in range(k):\n",
- " token = tokenizer.convert_ids_to_tokens(top_k.indices[i].item())\n",
- " score = top_k.values[i].item()\n",
- " print(f\"Prediction {i+1}: '{token}' with probability {score:.5f}\")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "6187e77e",
- "metadata": {},
- "outputs": [],
- "source": [
- "%%time\n",
- "tokenizer = AutoTokenizer.from_pretrained(\"bert-base-cased\")\n",
- "\n",
- "sequences = [\n",
- " \"Using a Transformer network is simple\",\n",
- " \"The quick brown fox jumps over the lazy dog\",\n",
- " \"To be or not to be, that is the question\"\n",
- "]\n",
- "\n",
- "# Tokenize the input sequences and convert them to padded and truncated integer token IDs\n",
- "inputs = tokenizer(\n",
- " sequences,\n",
- " padding=True,\n",
- " truncation=True,\n",
- " return_tensors=\"pt\"\n",
- ")\n",
- "\n",
- "# Print the resulting input IDs and attention masks\n",
- "print(inputs['input_ids'])\n",
- "print(inputs['attention_mask'])"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "fc259c5a",
- "metadata": {},
- "outputs": [],
- "source": []
- },
- {
- "cell_type": "markdown",
- "id": "43466db6",
- "metadata": {},
- "source": [
- "Huggingface:\n",
- "\n",
- "1. Understanding how to use the Pipeline (probably most useful) for various tasks, easy to use, and the different subtasks it can do like translation, QA, zero shot, sentiment analysis, token classification, etc. \n",
- "2. Understood how pipeline works in more detail by using AutoModel for various tasks as well as AutoTokenizer\n",
- "3. Load dataset\n",
- "4. How to finetune\n",
- "5. How to evaluate\n",
- "6. "
- ]
- },
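- {
- "cell_type": "code",
- "execution_count": null,
- "id": "e5b3d8f7",
- "metadata": {},
- "outputs": [],
- "source": [
- "# Minimal illustration of point 1 above: the high-level pipeline API with a default\n",
- "# checkpoint. Which model gets downloaded is chosen by HuggingFace, so treat the exact\n",
- "# scores as an example rather than a guarantee.\n",
- "from transformers import pipeline\n",
- "\n",
- "sentiment = pipeline(\"sentiment-analysis\")\n",
- "print(sentiment(\"HuggingFace pipelines make quick experiments easy.\"))"
- ]
- },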
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "97c474f2",
- "metadata": {},
- "outputs": [],
- "source": []
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "3ed5d8c2",
- "metadata": {},
- "outputs": [],
- "source": [
- "import torch\n",
- "from transformers import AdamW, AutoTokenizer, AutoModelForSequenceClassification\n",
- "\n",
- "# Same as before\n",
- "checkpoint = \"bert-base-uncased\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(checkpoint)\n",
- "model = AutoModelForSequenceClassification.from_pretrained(checkpoint)\n",
- "sequences = [\n",
- " \"I've been waiting for a HuggingFace course my whole life.\",\n",
- " \"This course is amazing!\",\n",
- "]\n",
- "batch = tokenizer(sequences, padding=True, truncation=True, return_tensors=\"pt\")\n",
- "\n",
- "# This is new\n",
- "batch[\"labels\"] = torch.tensor([1, 1])\n",
- "\n",
- "optimizer = AdamW(model.parameters())\n",
- "loss = model(**batch).loss\n",
- "loss.backward()\n",
- "optimizer.step()"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "c598624f",
- "metadata": {},
- "outputs": [],
- "source": [
- "from datasets import load_dataset\n",
- "raw_datasets = load_dataset(\"glue\", \"mrpc\")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "cd296227",
- "metadata": {},
- "outputs": [],
- "source": [
- "raw_train_dataset = raw_datasets[\"train\"]\n",
- "raw_train_dataset[0]"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "e462947a",
- "metadata": {},
- "outputs": [],
- "source": [
- "from datasets import load_dataset\n",
- "from transformers import AutoTokenizer, DataCollatorWithPadding\n",
- "raw_datasets = load_dataset(\"glue\", \"mrpc\")\n",
- "\n",
- "checkpoint = \"bert-base-uncased\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(checkpoint)\n",
- "\n",
- "def tokenize_function(example):\n",
- " return tokenizer(example[\"sentence1\"], example[\"sentence2\"], truncation=True)\n",
- "\n",
- "\n",
- "tokenized_datasets = raw_datasets.map(tokenize_function, batched=True)\n",
- "data_collator = DataCollatorWithPadding(tokenizer=tokenizer)\n",
- "\n",
- "\n",
- "from transformers import TrainingArguments\n",
- "training_args = TrainingArguments(\"test-trainer\")\n",
- "\n",
- "from transformers import AutoModelForSequenceClassification\n",
- "model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=2)\n",
- "\n",
- "import numpy as np\n",
- "import evaluate\n",
- "\n",
- "def compute_metrics(eval_preds):\n",
- " metric = evaluate.load(\"glue\", \"mrpc\")\n",
- " logits, labels = eval_preds\n",
- " predictions = np.argmax(logits, axis=-1)\n",
- " return metric.compute(predictions=predictions, references=labels)\n",
- "\n",
- "training_args = TrainingArguments(\"test-trainer\", evaluation_strategy=\"epoch\")\n",
- "model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=2)\n",
- "\n",
- "trainer = Trainer(\n",
- " model,\n",
- " training_args,\n",
- " train_dataset=tokenized_datasets[\"train\"],\n",
- " eval_dataset=tokenized_datasets[\"validation\"],\n",
- " data_collator=data_collator,\n",
- " tokenizer=tokenizer,\n",
- " compute_metrics=compute_metrics,\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "0e2795dc",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import TrainingArguments\n",
- "training_args = TrainingArguments(\"test-trainer\")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "3af29cd5",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import AutoModelForSequenceClassification\n",
- "model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=2)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "817f644e",
- "metadata": {},
- "outputs": [],
- "source": [
- "import numpy as np\n",
- "import evaluate"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "42819a6c",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "def compute_metrics(eval_preds):\n",
- " metric = evaluate.load(\"glue\", \"mrpc\")\n",
- " logits, labels = eval_preds\n",
- " predictions = np.argmax(logits, axis=-1)\n",
- " return metric.compute(predictions=predictions, references=labels)\n",
- "\n",
- "training_args = TrainingArguments(\"test-trainer\", evaluation_strategy=\"epoch\")\n",
- "model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=2)\n",
- "\n",
- "trainer = Trainer(\n",
- " model,\n",
- " training_args,\n",
- " train_dataset=tokenized_datasets[\"train\"],\n",
- " eval_dataset=tokenized_datasets[\"validation\"],\n",
- " data_collator=data_collator,\n",
- " tokenizer=tokenizer,\n",
- " compute_metrics=compute_metrics,\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "eb5986b0",
- "metadata": {
- "scrolled": false
- },
- "outputs": [],
- "source": [
- "from transformers import AutoModelForSeq2SeqLM, AutoTokenizer, DataCollatorForSeq2Seq, Seq2SeqTrainingArguments, Seq2SeqTrainer\n",
- "from datasets import load_dataset\n",
- "batch_size=32\n",
- "\n",
- "# Define the generator function to preprocess the data in batches\n",
- "def preprocess_generator(examples):\n",
- " for i in range(0, len(examples[\"article\"]), batch_size):\n",
- " batch = examples[\"article\"][i:i+batch_size]\n",
- " targets = examples[\"highlights\"][i:i+batch_size]\n",
- " model_inputs = tokenizer(batch, max_length=512, padding=\"max_length\", truncation=True)\n",
- " with tokenizer.as_target_tokenizer():\n",
- " model_targets = tokenizer(targets, max_length=128, padding=\"max_length\", truncation=True)\n",
- " model_inputs[\"labels\"] = model_targets[\"input_ids\"]\n",
- " yield model_inputs\n",
- "\n",
- "def preprocess_function(examples):\n",
- " articles = [ex for ex in examples[\"article\"]]\n",
- " summaries = [ex for ex in examples[\"highlights\"]]\n",
- "\n",
- " model_inputs = tokenizer(articles, max_length=512, padding=\"max_length\", truncation=True)\n",
- " with tokenizer.as_target_tokenizer():\n",
- " model_targets = tokenizer(summaries, max_length=128, padding=\"max_length\", truncation=True)\n",
- " \n",
- " model_inputs[\"labels\"] = model_targets[\"input_ids\"]\n",
- " return model_inputs\n",
- " \n",
- "# Load the dataset\n",
- "raw_datasets = load_dataset(\"cnn_dailymail\", \"3.0.0\")\n",
- "preprocessed_datasets = raw_datasets.map(preprocess_function, batched=True, num_proc=4)\n",
- "\n",
- "# Load the pre-trained model and tokenizer\n",
- "model_name = \"t5-small\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name)\n",
- "model = AutoModelForSeq2SeqLM.from_pretrained(model_name)\n",
- "\n",
- "# Define the data collator\n",
- "data_collator = DataCollatorForSeq2Seq(tokenizer, model=model)\n",
- "\n",
- "# Initialize the trainer arguments\n",
- "training_args = Seq2SeqTrainingArguments(\n",
- " output_dir=\"./results\",\n",
- " evaluation_strategy = \"epoch\",\n",
- " learning_rate=2e-5,\n",
- " per_device_train_batch_size=batch_size,\n",
- " max_steps=1000,\n",
- " weight_decay=0.01,\n",
- " push_to_hub=False,\n",
- ")\n",
- "\n",
- "# Initialize the trainer\n",
- "trainer = Seq2SeqTrainer(\n",
- " model=model,\n",
- " args=training_args,\n",
- " train_dataset=train_ds,\n",
- " data_collator=data_collator,\n",
- " tokenizer=tokenizer,\n",
- ")\n",
- "\n",
- "# Start the training\n",
- "trainer.train()\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "7d62583e",
- "metadata": {},
- "outputs": [],
- "source": [
- "from datasets import load_metric"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "d310a7b3",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "preprocessed_datasets"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "99d422cc",
- "metadata": {
- "scrolled": false
- },
- "outputs": [],
- "source": [
- "# Load the pre-trained model and tokenizer\n",
- "model_name = \"t5-small\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name)\n",
- "model = AutoModelForSeq2SeqLM.from_pretrained(model_name)\n",
- "\n",
- "# Define the data collator\n",
- "data_collator = DataCollatorForSeq2Seq(tokenizer, model=model)\n",
- "\n",
- "# Initialize the trainer arguments\n",
- "training_args = Seq2SeqTrainingArguments(\n",
- " output_dir=\"./results\",\n",
- " learning_rate=2e-5,\n",
- " per_device_train_batch_size=batch_size,\n",
- " max_steps=5000,\n",
- " weight_decay=0.01,\n",
- " push_to_hub=False,\n",
- "    evaluation_strategy=\"steps\",\n",
- "    eval_steps=50,\n",
- "    predict_with_generate=True,  # so compute_metrics receives generated token ids instead of raw logits\n",
- ")\n",
- "\n",
- "# Load the ROUGE metric\n",
- "metric = load_metric(\"rouge\")\n",
- "\n",
- "# Define the evaluation function\n",
- "def compute_metrics(pred):\n",
- " labels = pred.label_ids\n",
- " preds = pred.predictions\n",
- " \n",
- " decoded_preds = tokenizer.batch_decode(preds, skip_special_tokens=True)\n",
- " decoded_labels = tokenizer.batch_decode(labels, skip_special_tokens=True)\n",
- " \n",
- " scores = metric.compute(predictions=decoded_preds, references=decoded_labels, rouge_types=[\"rouge1\"])[\"rouge1\"].mid\n",
- " \n",
- " return {\"rouge1_precision\": scores.precision, \"rouge1_recall\": scores.recall, \"rouge1_fmeasure\": scores.fmeasure}\n",
- "\n",
- "\n",
- "# Initialize the trainer\n",
- "trainer = Seq2SeqTrainer(\n",
- " model=model,\n",
- " args=training_args,\n",
- " train_dataset=preprocessed_datasets[\"train\"],\n",
- " eval_dataset=preprocessed_datasets[\"validation\"],\n",
- " data_collator=data_collator,\n",
- " tokenizer=tokenizer,\n",
- " compute_metrics=compute_metrics,\n",
- ")\n",
- "\n",
- "# Start the training\n",
- "trainer.train()"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "a5e97b57",
- "metadata": {},
- "outputs": [],
- "source": [
- "!pip install nltk\n",
- "!pip install rouge_score"
- ]
- },
- {
- "cell_type": "markdown",
- "id": "558c3e66",
- "metadata": {},
- "source": [
- "# Goal:\n",
- "\n",
- "1. Implement the full training pipeline (data loading for the CNN/DailyMail dataset, model training, evaluation, etc.) using HF.\n",
- "* Right now: stuck on on-the-fly dataset loading; we don't want to cache the tokenized dataset because it would take a lot of disk space (see the streaming sketch further down).\n",
- "\n",
- "2. Once step 1 works, go deeper on every step: download the dataset and load it as a custom dataset rather than through the simple HuggingFace API, to make it more general. Compare loading it as a custom HF dataset vs. a PyTorch Dataset class together with Lightning: speed difference? convenience? Also use the Lightning Trainer and see how to integrate it, then compare the pure HF approach with the Lightning + HF model approach and decide which we like the most."
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "624d49ca",
- "metadata": {},
- "outputs": [],
- "source": []
- }
- ],
- "metadata": {
- "kernelspec": {
- "display_name": "Python 3 (ipykernel)",
- "language": "python",
- "name": "python3"
- },
- "language_info": {
- "codemirror_mode": {
- "name": "ipython",
- "version": 3
- },
- "file_extension": ".py",
- "mimetype": "text/x-python",
- "name": "python",
- "nbconvert_exporter": "python",
- "pygments_lexer": "ipython3",
- "version": "3.10.9"
- }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
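The Goal cell above mentions being stuck on on-the-fly data loading, because caching a tokenized copy of cnn_dailymail takes a lot of disk space. A minimal sketch of one way to do this with the datasets streaming mode follows; it is not taken from the deleted notebooks, it simply reuses the cnn_dailymail column names and the 512/128 max lengths used above.

from datasets import load_dataset
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("t5-small")

def tokenize(batch):
    # Same shapes as the notebooks: 512-token articles, 128-token highlights.
    model_inputs = tokenizer(batch["article"], max_length=512, padding="max_length", truncation=True)
    with tokenizer.as_target_tokenizer():
        targets = tokenizer(batch["highlights"], max_length=128, padding="max_length", truncation=True)
    model_inputs["labels"] = targets["input_ids"]
    return model_inputs

# streaming=True returns an IterableDataset: examples are downloaded and
# tokenized lazily as they are consumed, so no tokenized cache is written to disk.
stream = load_dataset("cnn_dailymail", "3.0.0", split="train", streaming=True)
stream = stream.map(tokenize, batched=True)

example = next(iter(stream))  # the raw text columns are still present alongside the token ids
print(len(example["input_ids"]), len(example["labels"]))  # 512 128

The streamed dataset can then be fed to a DataLoader with a collator that stacks the lists into tensors; the trade-off is that only buffer-based shuffling is available instead of a full random shuffle of the split.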
diff --git a/ML/Pytorch/huggingface/cnndaily_t5_lightning_customdataloading.ipynb b/ML/Pytorch/huggingface/cnndaily_t5_lightning_customdataloading.ipynb
deleted file mode 100644
index a3216e9..0000000
--- a/ML/Pytorch/huggingface/cnndaily_t5_lightning_customdataloading.ipynb
+++ /dev/null
@@ -1,317 +0,0 @@
-{
- "cells": [
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "f54ecf0b",
- "metadata": {},
- "outputs": [],
- "source": [
- "\"\"\"\n",
- "# HuggingFace Tutorial Series\n",
- "- 1. What is Huggingface?\n",
- "- 2. Common tasks we can do with HuggingFace & explain the tasks briefly, like what is question answering etc\n",
- "- 3. Using the HuggingFace Pipeline (High level feature)\n",
- "- 4. How the pipeline works at a lower level\n",
- "- 5. HuggingFace Datasets\n",
- "- 6. HuggingFace Tokenizer\n",
- "- 7. HuggingFace Evaluate\n",
- "- 8. HuggingFace Trainer\n",
- "- 9. Putting it together to finetune a news article summarizer\n",
- "- 10. Making it more general and robust with Lightning and custom data loading\n",
- "\"\"\""
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "ec1aae37",
- "metadata": {},
- "outputs": [],
- "source": [
- "import warnings\n",
- "warnings.simplefilter(\"ignore\")\n",
- "\n",
- "import os\n",
- "os.environ[\"CUDA_DEVICE_ORDER\"]=\"PCI_BUS_ID\"\n",
- "os.environ[\"CUDA_VISIBLE_DEVICES\"]=\"0\"\n",
- "\n",
- "import numpy as np\n",
- "import torch\n",
- "import datasets \n",
- "import pytorch_lightning as pl\n",
- "from datasets import load_dataset, load_metric\n",
- "\n",
- "from transformers import (\n",
- " AutoModel,\n",
- " AutoModelForSeq2SeqLM,\n",
- " AutoTokenizer,\n",
- " DataCollatorForSeq2Seq,\n",
- " Seq2SeqTrainingArguments,\n",
- " Seq2SeqTrainer,\n",
- ")\n",
- "\n",
- "import torch\n",
- "import pandas as pd\n",
- "from torch.utils.data import Dataset\n",
- "import pytorch_lightning as pl\n",
- "\n",
- "torch.set_float32_matmul_precision(\"medium\")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "5fd7cb0c",
- "metadata": {},
- "outputs": [],
- "source": [
- "model_name = \"t5-small\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "418cb03a",
- "metadata": {},
- "outputs": [],
- "source": [
- "class cnn_dailymail(Dataset):\n",
- " def __init__(self, csv_file, tokenizer, max_length=512):\n",
- " self.data = pd.read_csv(csv_file)\n",
- " self.tokenizer = tokenizer\n",
- " self.max_length = max_length\n",
- "\n",
- " def __len__(self):\n",
- " return len(self.data)\n",
- "\n",
- " def __getitem__(self, idx):\n",
- " article = self.data.loc[idx, 'article']\n",
- " highlights = self.data.loc[idx, 'highlights']\n",
- "\n",
- " inputs = self.tokenizer(\n",
- " article,\n",
- " truncation=True,\n",
- " padding='max_length',\n",
- " max_length=self.max_length,\n",
- " return_tensors='pt'\n",
- " )\n",
- " targets = self.tokenizer(\n",
- " highlights,\n",
- " truncation=True,\n",
- " padding='max_length',\n",
- " max_length=self.max_length,\n",
- " return_tensors='pt'\n",
- " )\n",
- "\n",
- " return {\n",
- " 'input_ids': inputs['input_ids'].squeeze(),\n",
- " 'attention_mask': inputs['attention_mask'].squeeze(),\n",
- " 'labels': targets['input_ids'].squeeze()\n",
- " }"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "aaa62755",
- "metadata": {},
- "outputs": [],
- "source": [
- "class MyDataModule(pl.LightningDataModule):\n",
- " def __init__(self, train_csv, val_csv, test_csv, tokenizer, batch_size=16, max_length=512):\n",
- " super().__init__()\n",
- " self.train_csv = train_csv\n",
- " self.val_csv = val_csv\n",
- " self.test_csv = test_csv\n",
- " self.tokenizer = tokenizer\n",
- " self.batch_size = batch_size\n",
- " self.max_length = max_length\n",
- "\n",
- " def setup(self, stage=None):\n",
- " if stage in ('fit', None):\n",
- " self.train_dataset = cnn_dailymail(self.train_csv, self.tokenizer, self.max_length)\n",
- " self.val_dataset = cnn_dailymail(self.val_csv, self.tokenizer, self.max_length)\n",
- " if stage in ('test', None):\n",
- " self.test_dataset = cnn_dailymail(self.test_csv, self.tokenizer, self.max_length)\n",
- "\n",
- " def train_dataloader(self):\n",
- " return torch.utils.data.DataLoader(self.train_dataset, batch_size=self.batch_size, shuffle=True, num_workers=4)\n",
- "\n",
- " def val_dataloader(self):\n",
- " return torch.utils.data.DataLoader(self.val_dataset, batch_size=self.batch_size, shuffle=False, num_workers=2)\n",
- "\n",
- " def test_dataloader(self):\n",
- " return torch.utils.data.DataLoader(self.test_dataset, batch_size=self.batch_size, shuffle=False, num_workers=2)\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "fbb699e1",
- "metadata": {},
- "outputs": [],
- "source": [
- "class MyLightningModule(pl.LightningModule):\n",
- " def __init__(self, model_name, learning_rate, weight_decay):\n",
- " super().__init__()\n",
- " self.model_name = model_name\n",
- " self.learning_rate = learning_rate\n",
- " self.weight_decay = weight_decay\n",
- " \n",
- " # Load the pre-trained model and tokenizer\n",
- " self.model = torch.compile(AutoModelForSeq2SeqLM.from_pretrained(self.model_name))\n",
- " \n",
- " # Load the ROUGE metric\n",
- " self.metric = load_metric(\"rouge\")\n",
- "\n",
- " def forward(self, input_ids, attention_mask, labels=None):\n",
- " output = self.model(\n",
- " input_ids=input_ids,\n",
- " attention_mask=attention_mask,\n",
- " labels=labels,\n",
- " )\n",
- " return output.loss, output.logits\n",
- " \n",
- " def training_step(self, batch, batch_idx):\n",
- " input_ids = batch[\"input_ids\"]\n",
- " attention_mask = batch[\"attention_mask\"]\n",
- " labels = batch[\"labels\"]\n",
- " loss, logits = self(input_ids, attention_mask, labels)\n",
- " self.log('train_loss', loss, on_epoch=True, on_step=True, prog_bar=True)\n",
- " return {'loss': loss, 'logits': logits}\n",
- " \n",
- " def validation_step(self, batch, batch_idx):\n",
- " input_ids = batch[\"input_ids\"]\n",
- " attention_mask = batch[\"attention_mask\"]\n",
- " labels = batch[\"labels\"]\n",
- " loss, logits = self(input_ids, attention_mask, labels)\n",
- " self.log('val_loss', loss, on_epoch=True, on_step=False)\n",
- " \n",
- " # Save logits and labels as instance attributes\n",
- " if not hasattr(self, \"logits\"):\n",
- " self.logits = logits\n",
- " else:\n",
- " self.logits = torch.cat((self.logits, logits), dim=0)\n",
- " \n",
- " if not hasattr(self, \"labels\"):\n",
- " self.labels = labels\n",
- " else:\n",
- " self.labels = torch.cat((self.labels, labels), dim=0)\n",
- " \n",
- " return {'loss': loss, 'logits': logits, \"labels\":labels}\n",
- " \n",
- " def on_validation_epoch_end(self):\n",
- " # Convert logits to predicted token IDs\n",
- " pred_token_ids = self.logits.argmax(dim=-1)\n",
- "\n",
- " # Decode predictions and labels using the saved instance attributes\n",
- " decoded_preds = tokenizer.batch_decode(pred_token_ids, skip_special_tokens=True)\n",
- " decoded_labels = tokenizer.batch_decode(self.labels, skip_special_tokens=True)\n",
- "\n",
- " # Compute ROUGE scores\n",
- " scores = self.metric.compute(predictions=decoded_preds, references=decoded_labels, rouge_types=[\"rouge1\"])[\"rouge1\"].mid\n",
- "\n",
- " self.log('rouge1_precision', scores.precision, prog_bar=True)\n",
- " self.log('rouge1_recall', scores.recall, prog_bar=True)\n",
- " self.log('rouge1_fmeasure', scores.fmeasure, prog_bar=True)\n",
- "\n",
- " # Clear logits and labels instance attributes for the next validation epoch\n",
- " del self.logits\n",
- " del self.labels\n",
- " \n",
- " def configure_optimizers(self):\n",
- " optimizer = torch.optim.AdamW(self.parameters(), lr=self.learning_rate, weight_decay=self.weight_decay)\n",
- " return optimizer\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "dd63c628",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "# File paths\n",
- "train_csv = \"train.csv\"\n",
- "val_csv = \"validation.csv\"\n",
- "test_csv = \"test.csv\"\n",
- "\n",
- "# Create the data module\n",
- "dm = MyDataModule(train_csv, val_csv, test_csv, tokenizer, batch_size=16)\n",
- "dm.setup()\n",
- "\n",
- "model = MyLightningModule(model_name=\"t5-small\", learning_rate=1e-4, weight_decay=1e-5)\n",
- "trainer = pl.Trainer(accelerator=\"gpu\", devices=[0], max_epochs=1, precision=16)\n",
- "trainer.fit(model, datamodule=dm)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "b5d3d684",
- "metadata": {},
- "outputs": [],
- "source": [
- ]
- },
- {
- "cell_type": "markdown",
- "id": "a0494596",
- "metadata": {},
- "source": [
- "### next steps:\n",
- "* Articles longer than 512 tokens are currently truncated; check whether this causes issues when articles are much longer\n",
- "\n",
- "#### what we've done:\n",
- "* Change the data loading so it's more general, i.e. on-the-fly loading from disk\n",
- "* Add torch.compile\n",
- "* 1. Clean up the code, make it into scripts instead of a notebook -> train for an epoch (add multi-GPU training?)\n",
- "* Add TensorBoard visualization\n",
- "* Train from scratch (not from pretrained weights) to make sure the training setup works and the loss actually improves\n",
- "* 2. Create an inference step: send in a news article -> get a summary, check that it works (see the inference sketch below)\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "80a2efab",
- "metadata": {},
- "outputs": [],
- "source": []
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "0f9b71ab",
- "metadata": {},
- "outputs": [],
- "source": []
- }
- ],
- "metadata": {
- "kernelspec": {
- "display_name": "Python 3 (ipykernel)",
- "language": "python",
- "name": "python3"
- },
- "language_info": {
- "codemirror_mode": {
- "name": "ipython",
- "version": 3
- },
- "file_extension": ".py",
- "mimetype": "text/x-python",
- "name": "python",
- "nbconvert_exporter": "python",
- "pygments_lexer": "ipython3",
- "version": "3.10.9"
- }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
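The "next steps" cell above lists an inference step: news article in, summary out. A minimal sketch of what that could look like is shown below; it is not taken from the deleted notebooks and assumes a T5-style checkpoint (the plain t5-small weights here, or the path to a fine-tuned checkpoint) together with T5's "summarize: " task prefix.

import torch
from transformers import AutoModelForSeq2SeqLM, AutoTokenizer

model_name = "t5-small"  # or a path to a fine-tuned checkpoint directory
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSeq2SeqLM.from_pretrained(model_name).eval()

def summarize(article: str, max_new_tokens: int = 128) -> str:
    # T5 was pretrained with task prefixes, so prepend "summarize: " to the article.
    inputs = tokenizer("summarize: " + article, max_length=512, truncation=True, return_tensors="pt")
    with torch.no_grad():
        generated = model.generate(**inputs, max_new_tokens=max_new_tokens, num_beams=4)
    return tokenizer.decode(generated[0], skip_special_tokens=True)

print(summarize("The city council voted on Tuesday to approve the new transit budget, which ..."))

With the untrained-on-summarization t5-small weights the output will be rough; the point of the step is only to verify that the article -> summary path works end to end.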
diff --git a/ML/Pytorch/huggingface/dataset.py b/ML/Pytorch/huggingface/dataset.py
deleted file mode 100644
index 8255e21..0000000
--- a/ML/Pytorch/huggingface/dataset.py
+++ /dev/null
@@ -1,89 +0,0 @@
-import pandas as pd
-import pytorch_lightning as pl
-from torch.utils.data import Dataset
-import torch
-
-
-class cnn_dailymail(Dataset):
- def __init__(self, csv_file, tokenizer, max_length=512):
- self.data = pd.read_csv(csv_file)
-
-        # optionally subsample the training data (the commented-out code below keeps 5%) and reset the indices
- #if csv_file == "train.csv":
- # self.data = self.data.sample(frac=0.05, random_state=42).reset_index(drop=True)
-
- self.tokenizer = tokenizer
- self.max_length = max_length
-
- def __len__(self):
- return len(self.data)
-
- def __getitem__(self, idx):
- article = self.data.loc[idx, "article"]
- highlights = self.data.loc[idx, "highlights"]
-
- inputs = self.tokenizer(
- article,
- truncation=True,
- padding="max_length",
- max_length=self.max_length,
- return_tensors="pt",
- )
- targets = self.tokenizer(
- highlights,
- truncation=True,
- padding="max_length",
- max_length=self.max_length,
- return_tensors="pt",
- )
-
- return {
- "input_ids": inputs["input_ids"].squeeze(),
- "attention_mask": inputs["attention_mask"].squeeze(),
- "labels": targets["input_ids"].squeeze(),
- }
-
-
-class MyDataModule(pl.LightningDataModule):
- def __init__(
- self, train_csv, val_csv, test_csv, tokenizer, batch_size=16, max_length=512
- ):
- super().__init__()
- self.train_csv = train_csv
- self.val_csv = val_csv
- self.test_csv = test_csv
- self.tokenizer = tokenizer
- self.batch_size = batch_size
- self.max_length = max_length
-
- def setup(self, stage=None):
- if stage in ("fit", None):
- self.train_dataset = cnn_dailymail(
- self.train_csv, self.tokenizer, self.max_length
- )
- self.val_dataset = cnn_dailymail(
- self.val_csv, self.tokenizer, self.max_length
- )
- if stage in ("test", None):
- self.test_dataset = cnn_dailymail(
- self.test_csv, self.tokenizer, self.max_length
- )
-
- def train_dataloader(self):
- return torch.utils.data.DataLoader(
- self.train_dataset,
- batch_size=self.batch_size,
- pin_memory=True,
- shuffle=True,
- num_workers=6,
- )
-
- def val_dataloader(self):
- return torch.utils.data.DataLoader(
- self.val_dataset, batch_size=self.batch_size, shuffle=False, num_workers=2
- )
-
- def test_dataloader(self):
- return torch.utils.data.DataLoader(
- self.test_dataset, batch_size=self.batch_size, shuffle=False, num_workers=1
- )
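One detail worth noting about the cnn_dailymail Dataset above (and the notebook version of it): the targets are padded to max_length with the tokenizer's pad token, and those pad positions are then counted in the model's cross-entropy loss. Hugging Face seq2seq models ignore label positions set to -100, so a small sketch of masking the padding, not part of the original dataset.py, could look like this.

import torch
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("t5-small")

def mask_label_padding(label_ids: torch.Tensor, pad_token_id: int) -> torch.Tensor:
    # Replace pad positions with -100 so the cross-entropy loss ignores them.
    labels = label_ids.clone()
    labels[labels == pad_token_id] = -100
    return labels

target = tokenizer("A short summary.", padding="max_length", max_length=16, return_tensors="pt")
print(mask_label_padding(target["input_ids"][0], tokenizer.pad_token_id))

In __getitem__ this would be applied to targets["input_ids"].squeeze() before returning the labels; the DataCollatorForSeq2Seq used in the Trainer notebooks defaults to label_pad_token_id=-100 for the same reason, although it only applies it to positions it pads itself.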
diff --git a/ML/Pytorch/huggingface/finetune_t5_lightning.ipynb b/ML/Pytorch/huggingface/finetune_t5_lightning.ipynb
deleted file mode 100644
index da1dc98..0000000
--- a/ML/Pytorch/huggingface/finetune_t5_lightning.ipynb
+++ /dev/null
@@ -1,470 +0,0 @@
-{
- "cells": [
- {
- "cell_type": "code",
- "execution_count": 2,
- "id": "ec1aae37",
- "metadata": {},
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "2023-02-21 16:36:20.707209: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA\n",
- "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
- "2023-02-21 16:36:21.233575: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory\n",
- "2023-02-21 16:36:21.233623: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory\n",
- "2023-02-21 16:36:21.233628: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly.\n"
- ]
- }
- ],
- "source": [
- "import warnings\n",
- "warnings.simplefilter(\"ignore\")\n",
- "\n",
- "import os\n",
- "os.environ[\"CUDA_DEVICE_ORDER\"]=\"PCI_BUS_ID\"\n",
- "os.environ[\"CUDA_VISIBLE_DEVICES\"]=\"1\"\n",
- "\n",
- "import numpy as np\n",
- "import torch\n",
- "\n",
- "import datasets \n",
- "import pytorch_lightning as pl\n",
- "\n",
- "from datasets import load_dataset, load_metric\n",
- "\n",
- "from transformers import (\n",
- " AutoModel,\n",
- " AutoModelForSeq2SeqLM,\n",
- " AutoTokenizer,\n",
- " DataCollatorForSeq2Seq,\n",
- " Seq2SeqTrainingArguments,\n",
- " Seq2SeqTrainer,\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 3,
- "id": "5fd7cb0c",
- "metadata": {},
- "outputs": [],
- "source": [
- "model_name = \"t5-small\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 4,
- "id": "04530b1e",
- "metadata": {},
- "outputs": [],
- "source": [
- "# Define the LightningDataModule\n",
- "class MyDataModule(pl.LightningDataModule):\n",
- " def __init__(self, batch_size):\n",
- " super().__init__()\n",
- " self.batch_size = batch_size\n",
- " \n",
- " def prepare_data(self):\n",
- " # Download and preprocess the data\n",
- " load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"train[:10%]\")\n",
- " load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"validation[:10%]\")\n",
- " \n",
- " def setup(self, stage=None):\n",
- " # Load and preprocess the data\n",
- " train_data = load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"train[:10%]\")\n",
- " val_data = load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"validation[:10%]\")\n",
- "\n",
- " self.train_ds = train_data.map(\n",
- " self.preprocess_function, \n",
- " batched=True, \n",
- " batch_size=self.batch_size, \n",
- " remove_columns=[\"article\", \"highlights\", \"id\"]\n",
- " )\n",
- "\n",
- " self.val_ds = val_data.map(\n",
- " self.preprocess_function, \n",
- " batched=True, \n",
- " batch_size=self.batch_size,\n",
- " remove_columns=[\"article\", \"highlights\", \"id\"]\n",
- " )\n",
- "\n",
- " def preprocess_function(self, batch):\n",
- " inputs = tokenizer(batch[\"article\"], padding=\"max_length\", truncation=True, max_length=512)\n",
- " outputs = tokenizer(batch[\"highlights\"], padding=\"max_length\", truncation=True, max_length=128)\n",
- " batch[\"input_ids\"] = inputs.input_ids\n",
- " batch[\"attention_mask\"] = inputs.attention_mask\n",
- " batch[\"labels\"] = outputs.input_ids.copy()\n",
- " return batch\n",
- "\n",
- " def train_dataloader(self):\n",
- " return torch.utils.data.DataLoader(self.train_ds, batch_size=self.batch_size)\n",
- "\n",
- " def val_dataloader(self):\n",
- " return torch.utils.data.DataLoader(self.val_ds, batch_size=self.batch_size)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 7,
- "id": "fbb699e1",
- "metadata": {},
- "outputs": [],
- "source": [
- "class MyLightningModule(pl.LightningModule):\n",
- " def __init__(self, model_name, learning_rate, weight_decay, batch_size):\n",
- " super().__init__()\n",
- " self.model_name = model_name\n",
- " self.learning_rate = learning_rate\n",
- " self.weight_decay = weight_decay\n",
- " self.batch_size = batch_size\n",
- " \n",
- " # Load the pre-trained model and tokenizer\n",
- " self.model = AutoModelForSeq2SeqLM.from_pretrained(self.model_name)\n",
- "\n",
- " # Load the ROUGE metric\n",
- " self.metric = load_metric(\"rouge\")\n",
- "\n",
- " def forward(self, input_ids, attention_mask, labels=None):\n",
- " output = self.model(\n",
- " input_ids=input_ids,\n",
- " attention_mask=attention_mask,\n",
- " labels=labels,\n",
- " )\n",
- " return output.loss, output.logits\n",
- " \n",
- " def training_step(self, batch, batch_idx):\n",
- " input_ids = batch[\"input_ids\"]\n",
- " attention_mask = batch[\"attention_mask\"]\n",
- " labels = batch[\"labels\"]\n",
- " loss, logits = self(input_ids, attention_mask, labels)\n",
- " self.log('train_loss', loss, on_epoch=True, on_step=False)\n",
- " return {'loss': loss, 'logits': logits}\n",
- " \n",
- " def validation_step(self, batch, batch_idx):\n",
- " input_ids = batch[\"input_ids\"]\n",
- " attention_mask = batch[\"attention_mask\"]\n",
- " labels = batch[\"labels\"]\n",
- " loss, logits = self(input_ids, attention_mask, labels)\n",
- " self.log('val_loss', loss, on_epoch=True, on_step=False)\n",
- " return {'loss': loss, 'logits': logits, \"labels\":labels}\n",
- " \n",
- " def validation_epoch_end(self, outputs):\n",
- " decoded_preds = []\n",
- " decoded_labels = []\n",
- " for output in outputs:\n",
- " logits = output['logits']\n",
- " labels = output['labels']\n",
- "            # the tokenizer is a notebook-level global here; decode greedy predictions via argmax over the vocab\n",
- "            decoded_preds += tokenizer.batch_decode(logits.argmax(dim=-1), skip_special_tokens=True)\n",
- "            decoded_labels += tokenizer.batch_decode(labels, skip_special_tokens=True)\n",
- " \n",
- " scores = self.metric.compute(predictions=decoded_preds, references=decoded_labels, rouge_types=[\"rouge1\"])[\"rouge1\"].mid\n",
- " \n",
- " self.log('rouge1_precision', scores.precision, prog_bar=True)\n",
- " self.log('rouge1_recall', scores.recall, prog_bar=True)\n",
- " self.log('rouge1_fmeasure', scores.fmeasure, prog_bar=True)\n",
- " \n",
- " def configure_optimizers(self):\n",
- " optimizer = torch.optim.AdamW(self.parameters(), lr=self.learning_rate, weight_decay=self.weight_decay)\n",
- " return optimizer\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 8,
- "id": "dd63c628",
- "metadata": {
- "scrolled": false
- },
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "GPU available: True (cuda), used: True\n",
- "TPU available: False, using: 0 TPU cores\n",
- "IPU available: False, using: 0 IPUs\n",
- "HPU available: False, using: 0 HPUs\n",
- "Found cached dataset cnn_dailymail (/home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de)\n",
- "Found cached dataset cnn_dailymail (/home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de)\n",
- "Found cached dataset cnn_dailymail (/home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de)\n",
- "Found cached dataset cnn_dailymail (/home/mrbean/.cache/huggingface/datasets/cnn_dailymail/3.0.0/3.0.0/1b3c71476f6d152c31c1730e83ccb08bcf23e348233f4fcc11e182248e6bf7de)\n",
- "\n",
- "  [Dataset.map progress output truncated: train split, 1009/1795 batches at ~105-115 ba/s]\n"
- ]
- },
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "  [Dataset.map progress output truncated: train split 1795/1795 batches, validation split 84/84 batches, ~105-115 ba/s]\n",
- "LOCAL_RANK: 0 - CUDA_VISIBLE_DEVICES: [1]\n",
- "\n",
- " | Name | Type | Params\n",
- "-----------------------------------------------------\n",
- "0 | model | T5ForConditionalGeneration | 60.5 M\n",
- "-----------------------------------------------------\n",
- "60.5 M Trainable params\n",
- "0 Non-trainable params\n",
- "60.5 M Total params\n",
- "242.026 Total estimated model params size (MB)\n"
- ]
- },
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "Sanity Checking DataLoader 0: 0%| | 0/2 [00:00, ?it/s]"
- ]
- },
- {
- "ename": "AttributeError",
- "evalue": "'list' object has no attribute 'size'",
- "output_type": "error",
- "traceback": [
- "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
- "\u001b[0;31mAttributeError\u001b[0m Traceback (most recent call last)",
- "Cell \u001b[0;32mIn[8], line 5\u001b[0m\n\u001b[1;32m 3\u001b[0m trainer \u001b[38;5;241m=\u001b[39m pl\u001b[38;5;241m.\u001b[39mTrainer(accelerator\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mgpu\u001b[39m\u001b[38;5;124m\"\u001b[39m, devices\u001b[38;5;241m=\u001b[39m[\u001b[38;5;241m0\u001b[39m], max_epochs\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m10\u001b[39m)\n\u001b[1;32m 4\u001b[0m dm \u001b[38;5;241m=\u001b[39m MyDataModule(batch_size\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m16\u001b[39m)\n\u001b[0;32m----> 5\u001b[0m \u001b[43mtrainer\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mfit\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mdatamodule\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mdm\u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:608\u001b[0m, in \u001b[0;36mTrainer.fit\u001b[0;34m(self, model, train_dataloaders, val_dataloaders, datamodule, ckpt_path)\u001b[0m\n\u001b[1;32m 606\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mTypeError\u001b[39;00m(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m`Trainer.fit()` requires a `LightningModule`, got: \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mmodel\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__class__\u001b[39m\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__qualname__\u001b[39m\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 607\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mstrategy\u001b[38;5;241m.\u001b[39m_lightning_module \u001b[38;5;241m=\u001b[39m model\n\u001b[0;32m--> 608\u001b[0m \u001b[43mcall\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_call_and_handle_interrupt\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 609\u001b[0m \u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_fit_impl\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtrain_dataloaders\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mval_dataloaders\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mdatamodule\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mckpt_path\u001b[49m\n\u001b[1;32m 610\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/call.py:38\u001b[0m, in \u001b[0;36m_call_and_handle_interrupt\u001b[0;34m(trainer, trainer_fn, *args, **kwargs)\u001b[0m\n\u001b[1;32m 36\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m trainer\u001b[38;5;241m.\u001b[39mstrategy\u001b[38;5;241m.\u001b[39mlauncher\u001b[38;5;241m.\u001b[39mlaunch(trainer_fn, \u001b[38;5;241m*\u001b[39margs, trainer\u001b[38;5;241m=\u001b[39mtrainer, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs)\n\u001b[1;32m 37\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m---> 38\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mtrainer_fn\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 40\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m _TunerExitException:\n\u001b[1;32m 41\u001b[0m trainer\u001b[38;5;241m.\u001b[39m_call_teardown_hook()\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:650\u001b[0m, in \u001b[0;36mTrainer._fit_impl\u001b[0;34m(self, model, train_dataloaders, val_dataloaders, datamodule, ckpt_path)\u001b[0m\n\u001b[1;32m 643\u001b[0m ckpt_path \u001b[38;5;241m=\u001b[39m ckpt_path \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mresume_from_checkpoint\n\u001b[1;32m 644\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_ckpt_path \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_checkpoint_connector\u001b[38;5;241m.\u001b[39m_set_ckpt_path(\n\u001b[1;32m 645\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mstate\u001b[38;5;241m.\u001b[39mfn,\n\u001b[1;32m 646\u001b[0m ckpt_path, \u001b[38;5;66;03m# type: ignore[arg-type]\u001b[39;00m\n\u001b[1;32m 647\u001b[0m model_provided\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m,\n\u001b[1;32m 648\u001b[0m model_connected\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlightning_module \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m,\n\u001b[1;32m 649\u001b[0m )\n\u001b[0;32m--> 650\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_run\u001b[49m\u001b[43m(\u001b[49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mckpt_path\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mckpt_path\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 652\u001b[0m \u001b[38;5;28;01massert\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mstate\u001b[38;5;241m.\u001b[39mstopped\n\u001b[1;32m 653\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mtraining \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:1103\u001b[0m, in \u001b[0;36mTrainer._run\u001b[0;34m(self, model, ckpt_path)\u001b[0m\n\u001b[1;32m 1099\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_checkpoint_connector\u001b[38;5;241m.\u001b[39mrestore_training_state()\n\u001b[1;32m 1101\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_checkpoint_connector\u001b[38;5;241m.\u001b[39mresume_end()\n\u001b[0;32m-> 1103\u001b[0m results \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_run_stage\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1105\u001b[0m log\u001b[38;5;241m.\u001b[39mdetail(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;132;01m{\u001b[39;00m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__class__\u001b[39m\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__name__\u001b[39m\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m: trainer tearing down\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 1106\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_teardown()\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:1182\u001b[0m, in \u001b[0;36mTrainer._run_stage\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 1180\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mpredicting:\n\u001b[1;32m 1181\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_run_predict()\n\u001b[0;32m-> 1182\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_run_train\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:1195\u001b[0m, in \u001b[0;36mTrainer._run_train\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 1192\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_pre_training_routine()\n\u001b[1;32m 1194\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m isolate_rng():\n\u001b[0;32m-> 1195\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_run_sanity_check\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1197\u001b[0m \u001b[38;5;66;03m# enable train mode\u001b[39;00m\n\u001b[1;32m 1198\u001b[0m \u001b[38;5;28;01massert\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:1267\u001b[0m, in \u001b[0;36mTrainer._run_sanity_check\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 1265\u001b[0m \u001b[38;5;66;03m# run eval step\u001b[39;00m\n\u001b[1;32m 1266\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m torch\u001b[38;5;241m.\u001b[39mno_grad():\n\u001b[0;32m-> 1267\u001b[0m \u001b[43mval_loop\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrun\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1269\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_call_callback_hooks(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mon_sanity_check_end\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 1271\u001b[0m \u001b[38;5;66;03m# reset logger connector\u001b[39;00m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/loops/loop.py:199\u001b[0m, in \u001b[0;36mLoop.run\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 197\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[1;32m 198\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mon_advance_start(\u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs)\n\u001b[0;32m--> 199\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43madvance\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 200\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mon_advance_end()\n\u001b[1;32m 201\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_restarting \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/loops/dataloader/evaluation_loop.py:152\u001b[0m, in \u001b[0;36mEvaluationLoop.advance\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 150\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mnum_dataloaders \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m1\u001b[39m:\n\u001b[1;32m 151\u001b[0m kwargs[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mdataloader_idx\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m=\u001b[39m dataloader_idx\n\u001b[0;32m--> 152\u001b[0m dl_outputs \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mepoch_loop\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrun\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_data_fetcher\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mdl_max_batches\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 154\u001b[0m \u001b[38;5;66;03m# store batch level output per dataloader\u001b[39;00m\n\u001b[1;32m 155\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_outputs\u001b[38;5;241m.\u001b[39mappend(dl_outputs)\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/loops/loop.py:199\u001b[0m, in \u001b[0;36mLoop.run\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 197\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[1;32m 198\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mon_advance_start(\u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs)\n\u001b[0;32m--> 199\u001b[0m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43madvance\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 200\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mon_advance_end()\n\u001b[1;32m 201\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_restarting \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/loops/epoch/evaluation_epoch_loop.py:137\u001b[0m, in \u001b[0;36mEvaluationEpochLoop.advance\u001b[0;34m(self, data_fetcher, dl_max_batches, kwargs)\u001b[0m\n\u001b[1;32m 134\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mbatch_progress\u001b[38;5;241m.\u001b[39mincrement_started()\n\u001b[1;32m 136\u001b[0m \u001b[38;5;66;03m# lightning module methods\u001b[39;00m\n\u001b[0;32m--> 137\u001b[0m output \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_evaluation_step\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 138\u001b[0m output \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_evaluation_step_end(output)\n\u001b[1;32m 140\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mbatch_progress\u001b[38;5;241m.\u001b[39mincrement_processed()\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/loops/epoch/evaluation_epoch_loop.py:234\u001b[0m, in \u001b[0;36mEvaluationEpochLoop._evaluation_step\u001b[0;34m(self, **kwargs)\u001b[0m\n\u001b[1;32m 223\u001b[0m \u001b[38;5;250m\u001b[39m\u001b[38;5;124;03m\"\"\"The evaluation step (validation_step or test_step depending on the trainer's state).\u001b[39;00m\n\u001b[1;32m 224\u001b[0m \n\u001b[1;32m 225\u001b[0m \u001b[38;5;124;03mArgs:\u001b[39;00m\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 231\u001b[0m \u001b[38;5;124;03m the outputs of the step\u001b[39;00m\n\u001b[1;32m 232\u001b[0m \u001b[38;5;124;03m\"\"\"\u001b[39;00m\n\u001b[1;32m 233\u001b[0m hook_name \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mtest_step\u001b[39m\u001b[38;5;124m\"\u001b[39m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mtrainer\u001b[38;5;241m.\u001b[39mtesting \u001b[38;5;28;01melse\u001b[39;00m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mvalidation_step\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[0;32m--> 234\u001b[0m output \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mtrainer\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_call_strategy_hook\u001b[49m\u001b[43m(\u001b[49m\u001b[43mhook_name\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mvalues\u001b[49m\u001b[43m(\u001b[49m\u001b[43m)\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 236\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m output\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/trainer/trainer.py:1485\u001b[0m, in \u001b[0;36mTrainer._call_strategy_hook\u001b[0;34m(self, hook_name, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1482\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m\n\u001b[1;32m 1484\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mprofiler\u001b[38;5;241m.\u001b[39mprofile(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m[Strategy]\u001b[39m\u001b[38;5;132;01m{\u001b[39;00m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mstrategy\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__class__\u001b[39m\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__name__\u001b[39m\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m.\u001b[39m\u001b[38;5;132;01m{\u001b[39;00mhook_name\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m):\n\u001b[0;32m-> 1485\u001b[0m output \u001b[38;5;241m=\u001b[39m \u001b[43mfn\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1487\u001b[0m \u001b[38;5;66;03m# restore current_fx when nested context\u001b[39;00m\n\u001b[1;32m 1488\u001b[0m pl_module\u001b[38;5;241m.\u001b[39m_current_fx_name \u001b[38;5;241m=\u001b[39m prev_fx_name\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/pytorch_lightning/strategies/strategy.py:390\u001b[0m, in \u001b[0;36mStrategy.validation_step\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 388\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mprecision_plugin\u001b[38;5;241m.\u001b[39mval_step_context():\n\u001b[1;32m 389\u001b[0m \u001b[38;5;28;01massert\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mmodel, ValidationStep)\n\u001b[0;32m--> 390\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mvalidation_step\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n",
- "Cell \u001b[0;32mIn[7], line 36\u001b[0m, in \u001b[0;36mMyLightningModule.validation_step\u001b[0;34m(self, batch, batch_idx)\u001b[0m\n\u001b[1;32m 34\u001b[0m attention_mask \u001b[38;5;241m=\u001b[39m batch[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mattention_mask\u001b[39m\u001b[38;5;124m\"\u001b[39m]\n\u001b[1;32m 35\u001b[0m labels \u001b[38;5;241m=\u001b[39m batch[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mlabels\u001b[39m\u001b[38;5;124m\"\u001b[39m]\n\u001b[0;32m---> 36\u001b[0m loss, logits \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[43m(\u001b[49m\u001b[43minput_ids\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mattention_mask\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mlabels\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 37\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlog(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mval_loss\u001b[39m\u001b[38;5;124m'\u001b[39m, loss, on_epoch\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m, on_step\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mFalse\u001b[39;00m)\n\u001b[1;32m 38\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m {\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mloss\u001b[39m\u001b[38;5;124m'\u001b[39m: loss, \u001b[38;5;124m'\u001b[39m\u001b[38;5;124mlogits\u001b[39m\u001b[38;5;124m'\u001b[39m: logits, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mlabels\u001b[39m\u001b[38;5;124m\"\u001b[39m:labels}\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/torch/nn/modules/module.py:1194\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *input, **kwargs)\u001b[0m\n\u001b[1;32m 1190\u001b[0m \u001b[38;5;66;03m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m 1191\u001b[0m \u001b[38;5;66;03m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m 1192\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m (\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m 1193\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m _global_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> 1194\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mforward_call\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;28;43minput\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1195\u001b[0m \u001b[38;5;66;03m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m 1196\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[38;5;241m=\u001b[39m [], []\n",
- "Cell \u001b[0;32mIn[7], line 16\u001b[0m, in \u001b[0;36mMyLightningModule.forward\u001b[0;34m(self, input_ids, attention_mask, labels)\u001b[0m\n\u001b[1;32m 15\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mforward\u001b[39m(\u001b[38;5;28mself\u001b[39m, input_ids, attention_mask, labels\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m):\n\u001b[0;32m---> 16\u001b[0m output \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mmodel\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 17\u001b[0m \u001b[43m \u001b[49m\u001b[43minput_ids\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43minput_ids\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 18\u001b[0m \u001b[43m \u001b[49m\u001b[43mattention_mask\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mattention_mask\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 19\u001b[0m \u001b[43m \u001b[49m\u001b[43mlabels\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mlabels\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 20\u001b[0m \u001b[43m \u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 21\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m output\u001b[38;5;241m.\u001b[39mloss, output\u001b[38;5;241m.\u001b[39mlogits\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/torch/nn/modules/module.py:1194\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *input, **kwargs)\u001b[0m\n\u001b[1;32m 1190\u001b[0m \u001b[38;5;66;03m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m 1191\u001b[0m \u001b[38;5;66;03m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m 1192\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m (\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m 1193\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m _global_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> 1194\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mforward_call\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;28;43minput\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1195\u001b[0m \u001b[38;5;66;03m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m 1196\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[38;5;241m=\u001b[39m [], []\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/transformers/models/t5/modeling_t5.py:1624\u001b[0m, in \u001b[0;36mT5ForConditionalGeneration.forward\u001b[0;34m(self, input_ids, attention_mask, decoder_input_ids, decoder_attention_mask, head_mask, decoder_head_mask, cross_attn_head_mask, encoder_outputs, past_key_values, inputs_embeds, decoder_inputs_embeds, labels, use_cache, output_attentions, output_hidden_states, return_dict)\u001b[0m\n\u001b[1;32m 1621\u001b[0m \u001b[38;5;66;03m# Encode if needed (training, first prediction pass)\u001b[39;00m\n\u001b[1;32m 1622\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m encoder_outputs \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[1;32m 1623\u001b[0m \u001b[38;5;66;03m# Convert encoder inputs in embeddings if needed\u001b[39;00m\n\u001b[0;32m-> 1624\u001b[0m encoder_outputs \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mencoder\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m 1625\u001b[0m \u001b[43m \u001b[49m\u001b[43minput_ids\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43minput_ids\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1626\u001b[0m \u001b[43m \u001b[49m\u001b[43mattention_mask\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mattention_mask\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1627\u001b[0m \u001b[43m \u001b[49m\u001b[43minputs_embeds\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43minputs_embeds\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1628\u001b[0m \u001b[43m \u001b[49m\u001b[43mhead_mask\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mhead_mask\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1629\u001b[0m \u001b[43m \u001b[49m\u001b[43moutput_attentions\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43moutput_attentions\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1630\u001b[0m \u001b[43m \u001b[49m\u001b[43moutput_hidden_states\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43moutput_hidden_states\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1631\u001b[0m \u001b[43m \u001b[49m\u001b[43mreturn_dict\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mreturn_dict\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m 1632\u001b[0m \u001b[43m \u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1633\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m return_dict \u001b[38;5;129;01mand\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(encoder_outputs, BaseModelOutput):\n\u001b[1;32m 1634\u001b[0m encoder_outputs \u001b[38;5;241m=\u001b[39m BaseModelOutput(\n\u001b[1;32m 1635\u001b[0m last_hidden_state\u001b[38;5;241m=\u001b[39mencoder_outputs[\u001b[38;5;241m0\u001b[39m],\n\u001b[1;32m 1636\u001b[0m hidden_states\u001b[38;5;241m=\u001b[39mencoder_outputs[\u001b[38;5;241m1\u001b[39m] \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mlen\u001b[39m(encoder_outputs) \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m1\u001b[39m \u001b[38;5;28;01melse\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m,\n\u001b[1;32m 1637\u001b[0m attentions\u001b[38;5;241m=\u001b[39mencoder_outputs[\u001b[38;5;241m2\u001b[39m] \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mlen\u001b[39m(encoder_outputs) \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m2\u001b[39m \u001b[38;5;28;01melse\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m,\n\u001b[1;32m 1638\u001b[0m )\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/torch/nn/modules/module.py:1194\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *input, **kwargs)\u001b[0m\n\u001b[1;32m 1190\u001b[0m \u001b[38;5;66;03m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m 1191\u001b[0m \u001b[38;5;66;03m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m 1192\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m (\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m 1193\u001b[0m \u001b[38;5;129;01mor\u001b[39;00m _global_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> 1194\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mforward_call\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;28;43minput\u001b[39;49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m 1195\u001b[0m \u001b[38;5;66;03m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m 1196\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[38;5;241m=\u001b[39m [], []\n",
- "File \u001b[0;32m~/.conda/envs/whisper_lightning/lib/python3.10/site-packages/transformers/models/t5/modeling_t5.py:944\u001b[0m, in \u001b[0;36mT5Stack.forward\u001b[0;34m(self, input_ids, attention_mask, encoder_hidden_states, encoder_attention_mask, inputs_embeds, head_mask, cross_attn_head_mask, past_key_values, use_cache, output_attentions, output_hidden_states, return_dict)\u001b[0m\n\u001b[1;32m 940\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\n\u001b[1;32m 941\u001b[0m \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mYou cannot specify both \u001b[39m\u001b[38;5;132;01m{\u001b[39;00merr_msg_prefix\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124minput_ids and \u001b[39m\u001b[38;5;132;01m{\u001b[39;00merr_msg_prefix\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124minputs_embeds at the same time\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[1;32m 942\u001b[0m )\n\u001b[1;32m 943\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m input_ids \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[0;32m--> 944\u001b[0m input_shape \u001b[38;5;241m=\u001b[39m \u001b[43minput_ids\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43msize\u001b[49m()\n\u001b[1;32m 945\u001b[0m input_ids \u001b[38;5;241m=\u001b[39m input_ids\u001b[38;5;241m.\u001b[39mview(\u001b[38;5;241m-\u001b[39m\u001b[38;5;241m1\u001b[39m, input_shape[\u001b[38;5;241m-\u001b[39m\u001b[38;5;241m1\u001b[39m])\n\u001b[1;32m 946\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m inputs_embeds \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n",
- "\u001b[0;31mAttributeError\u001b[0m: 'list' object has no attribute 'size'"
- ]
- }
- ],
- "source": [
- "torch.set_float32_matmul_precision(\"medium\")\n",
- "model = MyLightningModule(model_name=\"t5-small\", learning_rate=1e-5, weight_decay=1e-4, batch_size=16)\n",
- "trainer = pl.Trainer(accelerator=\"gpu\", devices=[0], max_epochs=10)\n",
- "dm = MyDataModule(batch_size=16)\n",
- "trainer.fit(model, datamodule=dm)"
- ]
- },
- {
- "cell_type": "markdown",
- "id": "aa7b1ab0",
- "metadata": {},
- "source": [
- "### Recap of what we did:\n",
- "* Finetuned T5-Small on DailyCNN (summarize news articles) using HF Trainer and data loading\n",
- "* Converted to Lightning code \n",
- "\n",
- "### To do next:\n",
- "* Make it work with the evaluation somethings wrong now, don't think it's a big issue\n",
- "* Clean up the code a bit\n",
- "* Compare it with HF, add predict function, modify data loading so it's from scratch / more general way of doing it."
- ]
- },
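- {
- "cell_type": "markdown",
- "id": "1c2d3e4f",
- "metadata": {},
- "source": [
- "A possible fix for the `AttributeError` above (an untested sketch): the error means `input_ids` reached T5 as a Python list instead of a `torch.Tensor`. If the batches come from an HF dataset tokenized with `.map()`, setting its format to torch should fix it; for a custom `Dataset` that returns lists, a collate function that stacks them into tensors does the same. `tokenized_ds` below is a placeholder name."
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "2d3e4f5a",
- "metadata": {},
- "outputs": [],
- "source": [
- "import torch\n",
- "\n",
- "# If the data comes from an HF dataset tokenized with .map(), make it yield torch\n",
- "# tensors instead of lists (tokenized_ds is a placeholder for that dataset):\n",
- "# tokenized_ds.set_format(type=\"torch\", columns=[\"input_ids\", \"attention_mask\", \"labels\"])\n",
- "\n",
- "# For a custom map-style Dataset that returns per-sample lists, a collate_fn that\n",
- "# stacks them into tensors has the same effect:\n",
- "def collate_to_tensors(features):\n",
- "    return {key: torch.tensor([f[key] for f in features]) for key in features[0]}"
- ]
- },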
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "80a2efab",
- "metadata": {},
- "outputs": [],
- "source": []
- }
- ],
- "metadata": {
- "kernelspec": {
- "display_name": "Python 3 (ipykernel)",
- "language": "python",
- "name": "python3"
- },
- "language_info": {
- "codemirror_mode": {
- "name": "ipython",
- "version": 3
- },
- "file_extension": ".py",
- "mimetype": "text/x-python",
- "name": "python",
- "nbconvert_exporter": "python",
- "pygments_lexer": "ipython3",
- "version": "3.10.9"
- }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/ML/Pytorch/huggingface/finetuning_t5_small_cnndaily.ipynb b/ML/Pytorch/huggingface/finetuning_t5_small_cnndaily.ipynb
deleted file mode 100644
index 09bebc9..0000000
--- a/ML/Pytorch/huggingface/finetuning_t5_small_cnndaily.ipynb
+++ /dev/null
@@ -1,237 +0,0 @@
-{
- "cells": [
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "5372055b",
- "metadata": {},
- "outputs": [],
- "source": [
- "from jupyterthemes.stylefx import set_nb_theme\n",
- "set_nb_theme('chesterish')"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "11214a4a",
- "metadata": {},
- "outputs": [],
- "source": [
- "import os\n",
- "os.environ[\"CUDA_DEVICE_ORDER\"]=\"PCI_BUS_ID\"\n",
- "os.environ[\"CUDA_VISIBLE_DEVICES\"]=\"0\""
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "f45eb6b0",
- "metadata": {},
- "outputs": [],
- "source": [
- "import numpy as np\n",
- "import torch\n",
- "\n",
- "import datasets \n",
- "\n",
- "from datasets import load_dataset, load_metric\n",
- "\n",
- "from transformers import (\n",
- " AutoModel,\n",
- " AutoModelForMaskedLM,\n",
- " AutoModelForSeq2SeqLM,\n",
- " AutoModelForTokenClassification,\n",
- " AutoTokenizer,\n",
- " DataCollatorForSeq2Seq,\n",
- " pipeline,\n",
- " Seq2SeqTrainingArguments,\n",
- " Seq2SeqTrainer,\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "b2d26af4",
- "metadata": {},
- "outputs": [],
- "source": [
- "# Load the pre-trained model and tokenizer\n",
- "model_name = \"t5-small\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name)\n",
- "model = AutoModelForSeq2SeqLM.from_pretrained(model_name)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "363045f5",
- "metadata": {},
- "outputs": [],
- "source": [
- "def preprocess_function(batch):\n",
- " inputs = tokenizer(batch[\"article\"], padding=\"max_length\", truncation=True, max_length=512)\n",
- " outputs = tokenizer(batch[\"highlights\"], padding=\"max_length\", truncation=True, max_length=128)\n",
- " batch[\"input_ids\"] = inputs.input_ids\n",
- " batch[\"attention_mask\"] = inputs.attention_mask\n",
- " batch[\"labels\"] = outputs.input_ids.copy()\n",
- " return batch\n",
- "\n",
- "# Load the dataset\n",
- "train_data = load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"train\")\n",
- "val_data = load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"validation[:10%]\")\n",
- "\n",
- "train_ds = train_data.map(\n",
- " preprocess_function, \n",
- " batched=True, \n",
- " batch_size=256, \n",
- " remove_columns=[\"article\", \"highlights\", \"id\"]\n",
- ")\n",
- "\n",
- "val_ds = val_data.map(\n",
- " preprocess_function, \n",
- " batched=True, \n",
- " batch_size=256, \n",
- " remove_columns=[\"article\", \"highlights\", \"id\"]\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "0d58818f",
- "metadata": {},
- "outputs": [],
- "source": [
- "class MyLightningModule(pl.LightningModule):\n",
- " def __init__(self, model_name, learning_rate, weight_decay, batch_size, num_training_steps):\n",
- " super().__init__()\n",
- " self.model_name = model_name\n",
- " self.learning_rate = learning_rate\n",
- " self.weight_decay = weight_decay\n",
- " self.batch_size = batch_size\n",
- " self.num_training_steps = num_training_steps\n",
- " \n",
- " # Load the pre-trained model and tokenizer\n",
- " self.tokenizer = AutoTokenizer.from_pretrained(self.model_name)\n",
- " self.model = AutoModelForSeq2SeqLM.from_pretrained(self.model_name)\n",
- "\n",
- " def forward(self, input_ids, attention_mask, labels=None):\n",
- " output = self.model(\n",
- " input_ids=input_ids,\n",
- " attention_mask=attention_mask,\n",
- " labels=labels,\n",
- " )\n",
- " return output.loss, output.logits\n",
- " \n",
- " def training_step(self, batch, batch_idx):\n",
- " input_ids = batch[\"input_ids\"]\n",
- " attention_mask = batch[\"attention_mask\"]\n",
- " labels = batch[\"labels\"]\n",
- " \n",
- " loss\n",
- "\n",
- "# Define the data collator\n",
- "data_collator = DataCollatorForSeq2Seq(tokenizer, model=model)\n",
- "\n",
- "# Initialize the trainer arguments\n",
- "training_args = Seq2SeqTrainingArguments(\n",
- " output_dir=\"./results\",\n",
- " learning_rate=1e-5,\n",
- " per_device_train_batch_size=16,\n",
- " per_device_eval_batch_size=16,\n",
- " max_steps=5000,\n",
- " weight_decay=1e-4,\n",
- " push_to_hub=False,\n",
- " evaluation_strategy = \"steps\",\n",
- " eval_steps = 50,\n",
- " generation_max_length=128,\n",
- " predict_with_generate=True,\n",
- " logging_steps=100,\n",
- " gradient_accumulation_steps=1,\n",
- " fp16=True,\n",
- ")\n",
- "\n",
- "# Load the ROUGE metric\n",
- "metric = load_metric(\"rouge\")\n",
- "\n",
- "# Define the evaluation function\n",
- "def compute_metrics(pred):\n",
- " labels = pred.label_ids\n",
- " preds = pred.predictions\n",
- " decoded_preds = tokenizer.batch_decode(preds, skip_special_tokens=True)\n",
- " decoded_labels = tokenizer.batch_decode(labels, skip_special_tokens=True)\n",
- " scores = metric.compute(predictions=decoded_preds, references=decoded_labels, rouge_types=[\"rouge1\"])[\"rouge1\"].mid\n",
- " return {\"rouge1_precision\": scores.precision, \"rouge1_recall\": scores.recall, \"rouge1_fmeasure\": scores.fmeasure}\n",
- "\n",
- "\n",
- "# Initialize the trainer\n",
- "trainer = Seq2SeqTrainer(\n",
- " model=model,\n",
- " args=training_args,\n",
- " train_dataset=train_data,\n",
- " eval_dataset=val_data,\n",
- " data_collator=data_collator,\n",
- " tokenizer=tokenizer,\n",
- " compute_metrics=compute_metrics,\n",
- ")\n",
- "\n",
- "# Start the training\n",
- "trainer.train()"
- ]
- },
- {
- "cell_type": "markdown",
- "id": "5148159b",
- "metadata": {},
- "source": [
- "# Steps:\n",
- "1. Rewrite code to be more general\n",
- "\n",
- "a) Data loading should be from disk rather than their load_dataset, and should be on the fly\n",
- "\n",
- "b) Rewrite to Lightning code, Trainer etc using Lightning, compute metric fine that we use huggingface"
- ]
- },
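- {
- "cell_type": "markdown",
- "id": "3e4f5a6b",
- "metadata": {},
- "source": [
- "Rough sketch for step 1a (an assumption about the workflow, not code that was run here): export the CNN/DailyMail splits once to `train.csv` / `validation.csv` / `test.csv`, so the Lightning code can read them from disk and tokenize on the fly."
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "4f5a6b7c",
- "metadata": {},
- "outputs": [],
- "source": [
- "from datasets import load_dataset\n",
- "\n",
- "# One-time export of the CNN/DailyMail splits to CSV files on disk, so later\n",
- "# training runs can load from these files instead of calling load_dataset.\n",
- "for split in [\"train\", \"validation\", \"test\"]:\n",
- "    load_dataset(\"cnn_dailymail\", \"3.0.0\", split=split).to_csv(f\"{split}.csv\")"
- ]
- },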
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "95e33e40",
- "metadata": {},
- "outputs": [],
- "source": [
- "!nvidia-smi"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "4c0348c2",
- "metadata": {},
- "outputs": [],
- "source": []
- }
- ],
- "metadata": {
- "kernelspec": {
- "display_name": "Python 3 (ipykernel)",
- "language": "python",
- "name": "python3"
- },
- "language_info": {
- "codemirror_mode": {
- "name": "ipython",
- "version": 3
- },
- "file_extension": ".py",
- "mimetype": "text/x-python",
- "name": "python",
- "nbconvert_exporter": "python",
- "pygments_lexer": "ipython3",
- "version": "3.10.9"
- }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/ML/Pytorch/huggingface/learning.ipynb b/ML/Pytorch/huggingface/learning.ipynb
deleted file mode 100644
index c821b42..0000000
--- a/ML/Pytorch/huggingface/learning.ipynb
+++ /dev/null
@@ -1,644 +0,0 @@
-{
- "cells": [
- {
- "cell_type": "code",
- "execution_count": 23,
- "id": "7d5e92c6",
- "metadata": {},
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "[{'entity': 'I-FOOD', 'score': 0.49999642, 'index': 5, 'word': 'Turtle', 'start': 8, 'end': 14}, {'entity': 'I-FOOD', 'score': 0.6096488, 'index': 6, 'word': '##s', 'start': 14, 'end': 15}, {'entity': 'B-FOOD', 'score': 0.45608267, 'index': 7, 'word': 'Original', 'start': 16, 'end': 24}, {'entity': 'I-FOOD', 'score': 0.6613699, 'index': 8, 'word': 'Cara', 'start': 25, 'end': 29}, {'entity': 'I-FOOD', 'score': 0.5776781, 'index': 9, 'word': '##mel', 'start': 29, 'end': 32}, {'entity': 'I-FOOD', 'score': 0.86556953, 'index': 10, 'word': 'Chocolate', 'start': 33, 'end': 42}, {'entity': 'I-FOOD', 'score': 0.96111995, 'index': 11, 'word': 'P', 'start': 43, 'end': 44}, {'entity': 'I-FOOD', 'score': 0.8003402, 'index': 12, 'word': '##eca', 'start': 44, 'end': 47}, {'entity': 'I-FOOD', 'score': 0.9277613, 'index': 13, 'word': '##n', 'start': 47, 'end': 48}, {'entity': 'I-FOOD', 'score': 0.9217512, 'index': 15, 'word': '##luster', 'start': 50, 'end': 56}]\n"
- ]
- }
- ],
- "source": [
- "from transformers import AutoTokenizer, AutoModelForTokenClassification\n",
- "from transformers import pipeline\n",
- "\n",
- "tokenizer = AutoTokenizer.from_pretrained(\"Dizex/FoodBaseBERT\")\n",
- "model = AutoModelForTokenClassification.from_pretrained(\"Dizex/FoodBaseBERT\")\n",
- "\n",
- "pipe = pipeline(\"ner\", model=model, tokenizer=tokenizer)\n",
- "example = \"Demet's Turtles Original Caramel Chocolate Pecan Clusters 9.3 oz Holiday Gift Box\"\n",
- "\n",
- "ner_entity_results = pipe(example)\n",
- "print(ner_entity_results)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 31,
- "id": "bf67ee76",
- "metadata": {},
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "Turtle s Original Cara mel Chocolate P eca n luster\n"
- ]
- }
- ],
- "source": [
- "ner_entity_results = pipe(example)\n",
- "\n",
- "# Initialize the entity words list with an empty string\n",
- "entity_words = [\"\"]\n",
- "\n",
- "# Loop through each dictionary in the list and extract the entity word\n",
- "for result in ner_entity_results:\n",
- " if result[\"entity\"] == \"B-FOOD\":\n",
- " entity_words.append(result[\"word\"])\n",
- " elif result[\"entity\"] == \"I-FOOD\":\n",
- " entity_words[-1] += \" \" + result[\"word\"]\n",
- "\n",
- "# Remove any remaining ## symbols and extra spaces\n",
- "entity_words = [word.replace(\"##\", \"\").strip() for word in entity_words]\n",
- "\n",
- "# Join the entity words into a single string\n",
- "output = \" \".join(entity_words)\n",
- "\n",
- "print(output)\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "fc8e5ea0",
- "metadata": {},
- "outputs": [],
- "source": [
- "import torch\n",
- "print(torch.cuda.is_available())"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "d8a1e039",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import pipeline\n",
- "import numpy as np"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "6ad73024",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "classifier = pipeline(\"zero-shot-classification\")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "04f7e02c",
- "metadata": {},
- "outputs": [],
- "source": [
- "classifier(\n",
- " \"This is a course about the Transformers library\",\n",
- " candidate_labels=[\"machine learning\", \"gym\", \"food\"],\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "6fb246c2",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "from transformers import pipeline\n",
- "generator = pipeline(task=\"text-generation\", model=\"bigscience/bloom-1b7\", device=0)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "c4e174f0",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import AutoModelForTokenClassification, AutoModel, AutoTokenizer\n",
- "import torch\n",
- "\n",
- "# Define input text and pre-trained model checkpoint\n",
- "text = \"My name is wolfgang and I live in berlin\"\n",
- "checkpoint = \"Jean-Baptiste/roberta-large-ner-english\"\n",
- "\n",
- "# Instantiate tokenizer and encode input text\n",
- "tokenizer = AutoTokenizer.from_pretrained(checkpoint)\n",
- "inputs = tokenizer(text, padding=True, truncation=True, return_tensors=\"pt\")\n",
- "\n",
- "# Instantiate model and generate output\n",
- "model = AutoModel.from_pretrained(checkpoint)\n",
- "outputs = model(**inputs)\n",
- "print(outputs[0].shape)\n",
- "\n",
- "# Instantiate token classification model and generate predictions\n",
- "model = AutoModelForTokenClassification.from_pretrained(checkpoint)\n",
- "outputs = model(**inputs)\n",
- "predictions = torch.nn.functional.softmax(outputs.logits, dim=-1)\n",
- "print(predictions)\n",
- "print(model.config.id2label)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "8212bbaa",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import AutoTokenizer, AutoModelForMaskedLM\n",
- "\n",
- "tokenizer = AutoTokenizer.from_pretrained('xlm-roberta-large')\n",
- "model = AutoModelForMaskedLM.from_pretrained(\"xlm-roberta-large\")\n",
- "\n",
- "# prepare input\n",
- "text = \"Replace me by any text you'd like.\"\n",
- "encoded_input = tokenizer(text, return_tensors='pt')\n",
- "\n",
- "# forward pass\n",
- "output = model(**encoded_input)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "314cba41",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import AutoTokenizer, AutoModelForMaskedLM\n",
- "\n",
- "# Load the pre-trained tokenizer and model\n",
- "tokenizer = AutoTokenizer.from_pretrained('xlm-roberta-large')\n",
- "model = AutoModelForMaskedLM.from_pretrained(\"xlm-roberta-large\")\n",
- "\n",
- "# Define the input sentence with a masked token\n",
- "text = \"I want to a new car tomorrow.\"\n",
- "\n",
- "# Tokenize the input sentence, replacing the masked token with a special [MASK] token\n",
- "encoded_input = tokenizer(text, padding=True, truncation=True, return_tensors='pt')\n",
- "\n",
- "print(output.logits.shape)\n",
- "print(encoded_input['input_ids'][0].tolist().index(tokenizer.mask_token_id))\n",
- "\n",
- "# Extract the predicted probabilities for the masked token\n",
- "predicted_probabilities = output.logits[0, encoded_input['input_ids'][0].tolist().index(tokenizer.mask_token_id)]\n",
- "predicted_probabilities = torch.nn.functional.softmax(predicted_probabilities, dim=-1)\n",
- "\n",
- "# Get the top-k most probable predictions for the masked token\n",
- "k = 5\n",
- "top_k = torch.topk(predicted_probabilities, k)\n",
- "for i in range(k):\n",
- " token = tokenizer.convert_ids_to_tokens(top_k.indices[i].item())\n",
- " score = top_k.values[i].item()\n",
- " print(f\"Prediction {i+1}: '{token}' with probability {score:.5f}\")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "6187e77e",
- "metadata": {},
- "outputs": [],
- "source": [
- "%%time\n",
- "tokenizer = AutoTokenizer.from_pretrained(\"bert-base-cased\")\n",
- "\n",
- "sequences = [\n",
- " \"Using a Transformer network is simple\",\n",
- " \"The quick brown fox jumps over the lazy dog\",\n",
- " \"To be or not to be, that is the question\"\n",
- "]\n",
- "\n",
- "# Tokenize the input sequences and convert them to padded and truncated integer token IDs\n",
- "inputs = tokenizer(\n",
- " sequences,\n",
- " padding=True,\n",
- " truncation=True,\n",
- " return_tensors=\"pt\"\n",
- ")\n",
- "\n",
- "# Print the resulting input IDs and attention masks\n",
- "print(inputs['input_ids'])\n",
- "print(inputs['attention_mask'])"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "fc259c5a",
- "metadata": {},
- "outputs": [],
- "source": []
- },
- {
- "cell_type": "markdown",
- "id": "43466db6",
- "metadata": {},
- "source": [
- "Huggingface:\n",
- "\n",
- "1. Understanding how to use the Pipeline (probably most useful) for various tasks, easy to use, and the different subtasks it can do like translation, QA, zero shot, sentiment analysis, token classification, etc. \n",
- "2. Understood how pipeline works in more detail by using AutoModel for various tasks as well as AutoTokenizer\n",
- "3. Load dataset\n",
- "4. How to finetune\n",
- "5. How to evaluate\n",
- "6. "
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "97c474f2",
- "metadata": {},
- "outputs": [],
- "source": []
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "3ed5d8c2",
- "metadata": {},
- "outputs": [],
- "source": [
- "import torch\n",
- "from transformers import AdamW, AutoTokenizer, AutoModelForSequenceClassification\n",
- "\n",
- "# Same as before\n",
- "checkpoint = \"bert-base-uncased\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(checkpoint)\n",
- "model = AutoModelForSequenceClassification.from_pretrained(checkpoint)\n",
- "sequences = [\n",
- " \"I've been waiting for a HuggingFace course my whole life.\",\n",
- " \"This course is amazing!\",\n",
- "]\n",
- "batch = tokenizer(sequences, padding=True, truncation=True, return_tensors=\"pt\")\n",
- "\n",
- "# This is new\n",
- "batch[\"labels\"] = torch.tensor([1, 1])\n",
- "\n",
- "optimizer = AdamW(model.parameters())\n",
- "loss = model(**batch).loss\n",
- "loss.backward()\n",
- "optimizer.step()"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "c598624f",
- "metadata": {},
- "outputs": [],
- "source": [
- "from datasets import load_dataset\n",
- "raw_datasets = load_dataset(\"glue\", \"mrpc\")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "cd296227",
- "metadata": {},
- "outputs": [],
- "source": [
- "raw_train_dataset = raw_datasets[\"train\"]\n",
- "raw_train_dataset[0]"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "e462947a",
- "metadata": {},
- "outputs": [],
- "source": [
- "from datasets import load_dataset\n",
- "from transformers import AutoTokenizer, DataCollatorWithPadding\n",
- "raw_datasets = load_dataset(\"glue\", \"mrpc\")\n",
- "\n",
- "checkpoint = \"bert-base-uncased\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(checkpoint)\n",
- "\n",
- "def tokenize_function(example):\n",
- " return tokenizer(example[\"sentence1\"], example[\"sentence2\"], truncation=True)\n",
- "\n",
- "\n",
- "tokenized_datasets = raw_datasets.map(tokenize_function, batched=True)\n",
- "data_collator = DataCollatorWithPadding(tokenizer=tokenizer)\n",
- "\n",
- "\n",
- "from transformers import TrainingArguments\n",
- "training_args = TrainingArguments(\"test-trainer\")\n",
- "\n",
- "from transformers import AutoModelForSequenceClassification\n",
- "model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=2)\n",
- "\n",
- "import numpy as np\n",
- "import evaluate\n",
- "\n",
- "def compute_metrics(eval_preds):\n",
- " metric = evaluate.load(\"glue\", \"mrpc\")\n",
- " logits, labels = eval_preds\n",
- " predictions = np.argmax(logits, axis=-1)\n",
- " return metric.compute(predictions=predictions, references=labels)\n",
- "\n",
- "training_args = TrainingArguments(\"test-trainer\", evaluation_strategy=\"epoch\")\n",
- "model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=2)\n",
- "\n",
- "trainer = Trainer(\n",
- " model,\n",
- " training_args,\n",
- " train_dataset=tokenized_datasets[\"train\"],\n",
- " eval_dataset=tokenized_datasets[\"validation\"],\n",
- " data_collator=data_collator,\n",
- " tokenizer=tokenizer,\n",
- " compute_metrics=compute_metrics,\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "0e2795dc",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import TrainingArguments\n",
- "training_args = TrainingArguments(\"test-trainer\")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "3af29cd5",
- "metadata": {},
- "outputs": [],
- "source": [
- "from transformers import AutoModelForSequenceClassification\n",
- "model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=2)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "817f644e",
- "metadata": {},
- "outputs": [],
- "source": [
- "import numpy as np\n",
- "import evaluate"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "42819a6c",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "def compute_metrics(eval_preds):\n",
- " metric = evaluate.load(\"glue\", \"mrpc\")\n",
- " logits, labels = eval_preds\n",
- " predictions = np.argmax(logits, axis=-1)\n",
- " return metric.compute(predictions=predictions, references=labels)\n",
- "\n",
- "training_args = TrainingArguments(\"test-trainer\", evaluation_strategy=\"epoch\")\n",
- "model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=2)\n",
- "\n",
- "trainer = Trainer(\n",
- " model,\n",
- " training_args,\n",
- " train_dataset=tokenized_datasets[\"train\"],\n",
- " eval_dataset=tokenized_datasets[\"validation\"],\n",
- " data_collator=data_collator,\n",
- " tokenizer=tokenizer,\n",
- " compute_metrics=compute_metrics,\n",
- ")"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "eb5986b0",
- "metadata": {
- "scrolled": false
- },
- "outputs": [],
- "source": [
- "from transformers import AutoModelForSeq2SeqLM, AutoTokenizer, DataCollatorForSeq2Seq, Seq2SeqTrainingArguments, Seq2SeqTrainer\n",
- "from datasets import load_dataset\n",
- "batch_size=32\n",
- "\n",
- "# Define the generator function to preprocess the data in batches\n",
- "def preprocess_generator(examples):\n",
- " for i in range(0, len(examples[\"article\"]), batch_size):\n",
- " batch = examples[\"article\"][i:i+batch_size]\n",
- " targets = examples[\"highlights\"][i:i+batch_size]\n",
- " model_inputs = tokenizer(batch, max_length=512, padding=\"max_length\", truncation=True)\n",
- " with tokenizer.as_target_tokenizer():\n",
- " model_targets = tokenizer(targets, max_length=128, padding=\"max_length\", truncation=True)\n",
- " model_inputs[\"labels\"] = model_targets[\"input_ids\"]\n",
- " yield model_inputs\n",
- "\n",
- "def preprocess_function(examples):\n",
- " articles = [ex for ex in examples[\"article\"]]\n",
- " summaries = [ex for ex in examples[\"highlights\"]]\n",
- "\n",
- " model_inputs = tokenizer(articles, max_length=512, padding=\"max_length\", truncation=True)\n",
- " with tokenizer.as_target_tokenizer():\n",
- " model_targets = tokenizer(summaries, max_length=128, padding=\"max_length\", truncation=True)\n",
- " \n",
- " model_inputs[\"labels\"] = model_targets[\"input_ids\"]\n",
- " return model_inputs\n",
- " \n",
- "# Load the dataset\n",
- "raw_datasets = load_dataset(\"cnn_dailymail\", \"3.0.0\")\n",
- "preprocessed_datasets = raw_datasets.map(preprocess_function, batched=True, num_proc=4)\n",
- "\n",
- "# Load the pre-trained model and tokenizer\n",
- "model_name = \"t5-small\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name)\n",
- "model = AutoModelForSeq2SeqLM.from_pretrained(model_name)\n",
- "\n",
- "# Define the data collator\n",
- "data_collator = DataCollatorForSeq2Seq(tokenizer, model=model)\n",
- "\n",
- "# Initialize the trainer arguments\n",
- "training_args = Seq2SeqTrainingArguments(\n",
- " output_dir=\"./results\",\n",
- " evaluation_strategy = \"epoch\",\n",
- " learning_rate=2e-5,\n",
- " per_device_train_batch_size=batch_size,\n",
- " max_steps=1000,\n",
- " weight_decay=0.01,\n",
- " push_to_hub=False,\n",
- ")\n",
- "\n",
- "# Initialize the trainer\n",
- "trainer = Seq2SeqTrainer(\n",
- " model=model,\n",
- " args=training_args,\n",
- " train_dataset=train_ds,\n",
- " data_collator=data_collator,\n",
- " tokenizer=tokenizer,\n",
- ")\n",
- "\n",
- "# Start the training\n",
- "trainer.train()\n"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "7d62583e",
- "metadata": {},
- "outputs": [],
- "source": [
- "from datasets import load_metric"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "d310a7b3",
- "metadata": {
- "scrolled": true
- },
- "outputs": [],
- "source": [
- "preprocessed_datasets"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "99d422cc",
- "metadata": {
- "scrolled": false
- },
- "outputs": [],
- "source": [
- "# Load the pre-trained model and tokenizer\n",
- "model_name = \"t5-small\"\n",
- "tokenizer = AutoTokenizer.from_pretrained(model_name)\n",
- "model = AutoModelForSeq2SeqLM.from_pretrained(model_name)\n",
- "\n",
- "# Define the data collator\n",
- "data_collator = DataCollatorForSeq2Seq(tokenizer, model=model)\n",
- "\n",
- "# Initialize the trainer arguments\n",
- "training_args = Seq2SeqTrainingArguments(\n",
- " output_dir=\"./results\",\n",
- " learning_rate=2e-5,\n",
- " per_device_train_batch_size=batch_size,\n",
- " max_steps=5000,\n",
- " weight_decay=0.01,\n",
- " push_to_hub=False,\n",
- " evaluation_strategy = \"steps\",\n",
- " eval_steps = 50,\n",
- ")\n",
- "\n",
- "# Load the ROUGE metric\n",
- "metric = load_metric(\"rouge\")\n",
- "\n",
- "# Define the evaluation function\n",
- "def compute_metrics(pred):\n",
- " labels = pred.label_ids\n",
- " preds = pred.predictions\n",
- " \n",
- " decoded_preds = tokenizer.batch_decode(preds, skip_special_tokens=True)\n",
- " decoded_labels = tokenizer.batch_decode(labels, skip_special_tokens=True)\n",
- " \n",
- " scores = metric.compute(predictions=decoded_preds, references=decoded_labels, rouge_types=[\"rouge1\"])[\"rouge1\"].mid\n",
- " \n",
- " return {\"rouge1_precision\": scores.precision, \"rouge1_recall\": scores.recall, \"rouge1_fmeasure\": scores.fmeasure}\n",
- "\n",
- "\n",
- "# Initialize the trainer\n",
- "trainer = Seq2SeqTrainer(\n",
- " model=model,\n",
- " args=training_args,\n",
- " train_dataset=preprocessed_datasets[\"train\"],\n",
- " eval_dataset=preprocessed_datasets[\"validation\"],\n",
- " data_collator=data_collator,\n",
- " tokenizer=tokenizer,\n",
- " compute_metrics=compute_metrics,\n",
- ")\n",
- "\n",
- "# Start the training\n",
- "trainer.train()"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "a5e97b57",
- "metadata": {},
- "outputs": [],
- "source": [
- "!pip install nltk\n",
- "!pip install rouge_score"
- ]
- },
- {
- "cell_type": "markdown",
- "id": "558c3e66",
- "metadata": {},
- "source": [
- "# Goal:\n",
- "\n",
- "1. Implement full training from dataloading (dailycnn dataset), to model training, evaluation, etc, using HF. \n",
- "* Right now: stuck on on the fly dataset loading, we don't want to cache because this would take a lot of disk space etc.\n",
- "\n",
- "2. After we get step 1) working, we want to go deeper on every step, so download the dataset and load it as a custom dataset rather than using huggingface simple API, in order to make it more general. Compare with loading the ds as a custom HF dataset or using pytorch class together with lightning. Speed difference? Convenience? Also we want to use the lightning Trainer so see how we can integrate that. And then compare HF to the lightning + hf model approach and see what we like the most."
- ]
- },
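- {
- "cell_type": "markdown",
- "id": "5a6b7c8d",
- "metadata": {},
- "source": [
- "One way around the caching concern (a sketch, not what was run here): stream the dataset so nothing is written to the local cache and tokenization happens lazily while iterating. This assumes `preprocess_function` and `tokenizer` from the cells above are already defined."
- ]
- },
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "6b7c8d9e",
- "metadata": {},
- "outputs": [],
- "source": [
- "from datasets import load_dataset\n",
- "\n",
- "# Streaming mode downloads and yields examples on the fly; .map() is applied\n",
- "# lazily per batch, so no tokenized copy of the dataset is cached to disk.\n",
- "streamed_train = load_dataset(\"cnn_dailymail\", \"3.0.0\", split=\"train\", streaming=True)\n",
- "streamed_train = streamed_train.map(preprocess_function, batched=True)\n",
- "\n",
- "# Peek at one tokenized example to check that the lazy pipeline works.\n",
- "print(next(iter(streamed_train)).keys())"
- ]
- },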
- {
- "cell_type": "code",
- "execution_count": null,
- "id": "624d49ca",
- "metadata": {},
- "outputs": [],
- "source": []
- }
- ],
- "metadata": {
- "kernelspec": {
- "display_name": "Python 3 (ipykernel)",
- "language": "python",
- "name": "python3"
- },
- "language_info": {
- "codemirror_mode": {
- "name": "ipython",
- "version": 3
- },
- "file_extension": ".py",
- "mimetype": "text/x-python",
- "name": "python",
- "nbconvert_exporter": "python",
- "pygments_lexer": "ipython3",
- "version": "3.10.9"
- }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/ML/Pytorch/huggingface/learninghugg.py b/ML/Pytorch/huggingface/learninghugg.py
deleted file mode 100644
index 236cf3b..0000000
--- a/ML/Pytorch/huggingface/learninghugg.py
+++ /dev/null
@@ -1,41 +0,0 @@
-import numpy as np
-
-import evaluate
-from datasets import load_dataset
-from transformers import AutoTokenizer, DataCollatorWithPadding
-from transformers import Trainer
-
-raw_datasets = load_dataset("glue", "mrpc")
-checkpoint = "bert-base-uncased"
-tokenizer = AutoTokenizer.from_pretrained(checkpoint)
-
-
-def tokenize_function(example):
- return tokenizer(example["sentence1"], example["sentence2"], truncation=True)
-
-
-tokenized_datasets = raw_datasets.map(tokenize_function, batched=True)
-data_collator = DataCollatorWithPadding(tokenizer=tokenizer)
-
-
-from transformers import TrainingArguments
-training_args = TrainingArguments("test-trainer")
-
-from transformers import AutoModelForSequenceClassification
-model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=2)
-
-def compute_metrics(eval_preds):
- metric = evaluate.load("glue", "mrpc")
- logits, labels = eval_preds
- predictions = np.argmax(logits, axis=-1)
- return metric.compute(predictions=predictions, references=labels)
-
-training_args = TrainingArguments("test-trainer", evaluation_strategy="epoch")
-model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=2)
-
-trainer = Trainer(
- model,
- training_args,
- train_dataset=tokenized_datasets["train"],
- eval_dataset=tokenized_datasets["validation"],
- data_collator=data_collator,
- tokenizer=tokenizer,
- compute_metrics=compute_metrics,
-)
diff --git a/ML/Pytorch/huggingface/lightning_logs/version_0/events.out.tfevents.1676993704.mrbeast.566861.0 b/ML/Pytorch/huggingface/lightning_logs/version_0/events.out.tfevents.1676993704.mrbeast.566861.0
deleted file mode 100644
index ab84c26..0000000
Binary files a/ML/Pytorch/huggingface/lightning_logs/version_0/events.out.tfevents.1676993704.mrbeast.566861.0 and /dev/null differ
diff --git a/ML/Pytorch/huggingface/lightning_logs/version_0/hparams.yaml b/ML/Pytorch/huggingface/lightning_logs/version_0/hparams.yaml
deleted file mode 100644
index 0967ef4..0000000
--- a/ML/Pytorch/huggingface/lightning_logs/version_0/hparams.yaml
+++ /dev/null
@@ -1 +0,0 @@
-{}
diff --git a/ML/Pytorch/huggingface/lightning_logs/version_1/events.out.tfevents.1676993775.mrbeast.568809.0 b/ML/Pytorch/huggingface/lightning_logs/version_1/events.out.tfevents.1676993775.mrbeast.568809.0
deleted file mode 100644
index 9ac0e2a..0000000
Binary files a/ML/Pytorch/huggingface/lightning_logs/version_1/events.out.tfevents.1676993775.mrbeast.568809.0 and /dev/null differ
diff --git a/ML/Pytorch/huggingface/lightning_logs/version_1/hparams.yaml b/ML/Pytorch/huggingface/lightning_logs/version_1/hparams.yaml
deleted file mode 100644
index 0967ef4..0000000
--- a/ML/Pytorch/huggingface/lightning_logs/version_1/hparams.yaml
+++ /dev/null
@@ -1 +0,0 @@
-{}
diff --git a/ML/Pytorch/huggingface/lightning_logs/version_2/events.out.tfevents.1676993814.mrbeast.570170.0 b/ML/Pytorch/huggingface/lightning_logs/version_2/events.out.tfevents.1676993814.mrbeast.570170.0
deleted file mode 100644
index 256eb1d..0000000
Binary files a/ML/Pytorch/huggingface/lightning_logs/version_2/events.out.tfevents.1676993814.mrbeast.570170.0 and /dev/null differ
diff --git a/ML/Pytorch/huggingface/lightning_logs/version_2/hparams.yaml b/ML/Pytorch/huggingface/lightning_logs/version_2/hparams.yaml
deleted file mode 100644
index 0967ef4..0000000
--- a/ML/Pytorch/huggingface/lightning_logs/version_2/hparams.yaml
+++ /dev/null
@@ -1 +0,0 @@
-{}
diff --git a/ML/Pytorch/huggingface/lightning_logs/version_3/events.out.tfevents.1676993905.mrbeast.570170.1 b/ML/Pytorch/huggingface/lightning_logs/version_3/events.out.tfevents.1676993905.mrbeast.570170.1
deleted file mode 100644
index a60d00b..0000000
Binary files a/ML/Pytorch/huggingface/lightning_logs/version_3/events.out.tfevents.1676993905.mrbeast.570170.1 and /dev/null differ
diff --git a/ML/Pytorch/huggingface/lightning_logs/version_3/hparams.yaml b/ML/Pytorch/huggingface/lightning_logs/version_3/hparams.yaml
deleted file mode 100644
index 0967ef4..0000000
--- a/ML/Pytorch/huggingface/lightning_logs/version_3/hparams.yaml
+++ /dev/null
@@ -1 +0,0 @@
-{}
diff --git a/ML/Pytorch/huggingface/model.py b/ML/Pytorch/huggingface/model.py
deleted file mode 100644
index e7b2eb1..0000000
--- a/ML/Pytorch/huggingface/model.py
+++ /dev/null
@@ -1,130 +0,0 @@
-import torch
-import pytorch_lightning as pl
-from datasets import load_dataset, load_metric
-from transformers import T5Config, T5ForConditionalGeneration
-
-from transformers import (
- AutoModel,
- AutoModelForSeq2SeqLM,
- AutoTokenizer,
- DataCollatorForSeq2Seq,
- Seq2SeqTrainingArguments,
- Seq2SeqTrainer,
-)
-
-
-class MyLightningModule(pl.LightningModule):
- def __init__(self, model_name, learning_rate, weight_decay):
- super().__init__()
- self.model_name = model_name
- self.learning_rate = learning_rate
- self.weight_decay = weight_decay
- self.tokenizer = AutoTokenizer.from_pretrained(model_name)
-
- # Load the pre-trained model and tokenizer
- #self.model = torch.compile(
- # AutoModelForSeq2SeqLM.from_pretrained(self.model_name)
- #)
-
- # Create a T5-small configuration
- config = T5Config.from_pretrained("t5-small")
-
- # Initialize the T5 model with random weights
- self.model = torch.compile(T5ForConditionalGeneration(config))
-
- # Load the ROUGE metric
- self.metric = load_metric("rouge")
- self.logits = []
- self.labels = []
-
- def forward(self, input_ids, attention_mask, labels=None):
- output = self.model(
- input_ids=input_ids,
- attention_mask=attention_mask,
- labels=labels,
- )
- return output.loss, output.logits
-
- def training_step(self, batch, batch_idx):
- input_ids = batch["input_ids"]
- attention_mask = batch["attention_mask"]
- labels = batch["labels"]
- loss, logits = self(input_ids, attention_mask, labels)
- self.log("train_loss", loss, on_epoch=True, on_step=True, prog_bar=True)
- return {"loss": loss, "logits": logits}
-
- def validation_step(self, batch, batch_idx):
- input_ids = batch["input_ids"]
- attention_mask = batch["attention_mask"]
- labels = batch["labels"]
- loss, logits = self(input_ids, attention_mask, labels)
- self.log("val_loss", loss, on_epoch=True, on_step=False)
-
- # add logits and labels to instance attributes, but make sure to detach them
- # from the computational graph first
- self.logits.append(logits.argmax(dim=-1).detach().cpu())
- self.labels.append(labels.detach().cpu())
- return {"loss": loss, "logits": logits, "labels": labels}
-
- def on_validation_epoch_end(self):
- # Concatenate tensors in logits and labels lists
- pred_token_ids = torch.cat(self.logits, dim=0)
- true_labels = torch.cat(self.labels, dim=0)
-
- # Decode predictions and labels using the saved instance attributes
- decoded_preds = self.tokenizer.batch_decode(
- pred_token_ids, skip_special_tokens=True
- )
- decoded_labels = self.tokenizer.batch_decode(
- true_labels, skip_special_tokens=True
- )
-
- # Compute ROUGE scores
- scores = self.metric.compute(
- predictions=decoded_preds, references=decoded_labels, rouge_types=["rouge1"]
- )["rouge1"].mid
-
- self.log("rouge1_precision", scores.precision, prog_bar=True)
- self.log("rouge1_recall", scores.recall, prog_bar=True)
- self.log("rouge1_fmeasure", scores.fmeasure, prog_bar=True)
-
- # Clear logits and labels instance attributes for the next validation epoch
- self.logits.clear()
- self.labels.clear()
-
- def predict(self, article: str, max_input_length: int = 512, max_output_length: int = 150) -> str:
- # Set the model to evaluation mode
- self.model.eval()
-
- # Tokenize the input article
- inputs = self.tokenizer(
- article,
- max_length=max_input_length,
- padding="max_length",
- truncation=True,
- return_tensors="pt"
- )
-
- # Move the input tensors to the same device as the model
- inputs = {key: value.to(self.device) for key, value in inputs.items()}
-
- # Generate summary
- with torch.no_grad():
- output = self.model.generate(
- input_ids=inputs["input_ids"],
- attention_mask=inputs["attention_mask"],
- max_length=max_output_length,
- num_return_sequences=1,
- )
-
- # Decode and return the summary
- summary = self.tokenizer.decode(output[0], skip_special_tokens=True)
- return summary
-
- def configure_optimizers(self):
- optimizer = torch.optim.AdamW(
- self.parameters(), lr=self.learning_rate, weight_decay=self.weight_decay
- )
- return optimizer
-
-
diff --git a/ML/Pytorch/huggingface/test.py b/ML/Pytorch/huggingface/test.py
deleted file mode 100644
index dd1f9d8..0000000
--- a/ML/Pytorch/huggingface/test.py
+++ /dev/null
@@ -1,2 +0,0 @@
-l = ["cat", "dog"]
-sentence = "The quick brown fox jumps over the lazy dog"
diff --git a/ML/Pytorch/huggingface/train.py b/ML/Pytorch/huggingface/train.py
deleted file mode 100644
index 6b5a91f..0000000
--- a/ML/Pytorch/huggingface/train.py
+++ /dev/null
@@ -1,67 +0,0 @@
-from dataset import MyDataModule
-from model import MyLightningModule
-import pytorch_lightning as pl
-from pytorch_lightning import Trainer
-from pytorch_lightning.callbacks import ModelCheckpoint
-from pytorch_lightning.loggers import TensorBoardLogger
-from transformers import (
- AutoModel,
- AutoModelForSeq2SeqLM,
- AutoTokenizer,
- DataCollatorForSeq2Seq,
- Seq2SeqTrainingArguments,
- Seq2SeqTrainer,
-)
-import torch
-
-torch.set_float32_matmul_precision("medium")
-
-if __name__ == "__main__":
- # Define the checkpoint callback
- checkpoint_callback = ModelCheckpoint(
- monitor="val_loss",
- dirpath="checkpoints",
- filename="my_model-{epoch:02d}-{val_loss:.2f}",
- save_top_k=-1,
- every_n_epochs=1,
- verbose=True,
- )
- logger = TensorBoardLogger("tb_logs", name="t5_dailymail")
-
- model_name = "t5-small"
- tokenizer = AutoTokenizer.from_pretrained(model_name)
-
- # File paths
- train_csv = "train.csv"
- val_csv = "validation.csv"
- test_csv = "test.csv"
-
- # Create the data module
- dm = MyDataModule(train_csv, val_csv, test_csv, tokenizer, batch_size=32)
- dm.setup()
-
- model = MyLightningModule(
- model_name="t5-small", learning_rate=1e-4, weight_decay=1e-5
- )
-
-
- #checkpoint_path = "checkpoints/curr.ckpt"
- #checkpoint = torch.load(checkpoint_path)
- #model.load_state_dict(checkpoint["state_dict"])
-
- trainer = pl.Trainer(
- accelerator="gpu",
- devices=[0, 1],
- max_epochs=10,
- precision=16,
- logger=logger,
- callbacks=[checkpoint_callback],
- log_every_n_steps=10,
- )
- trainer.fit(model, dm)
- trainer.validate(model, dm)
-
- #example = """Former President Donald Trump claims in a social media post that he will be arrested next week. The claim comes while a New York prosecutor considers charging Trump in connection with hush money paid to adult film actress Stormy Daniels but there has been no official announcement of any plans for an indictment. What we know about Trump possibly facing criminal indictment in New York City. Trump has been entangled in several criminal investigations but the case related to Daniels is the longest-running of all of them, reaching back to 2016. On his platform Truth Social on Saturday morning, Trump cited "illegal leaks" that he will be arrested Tuesday and he called for protests. Trump, who is running for president in 2024, also defended himself, saying that he has not committed a crime — though he did not disclose what he expects to be charged with — and he accused the Manhattan District Attorney's Office of being "corrupt & highly political.". 'I'M BACK!' Trump posts on Facebook, YouTube for first time in two years. The Manhattan District Attorney's Office declined to comment on whether it will soon be pursing an arrest warrant for Trump. But the Associated Press reported that law enforcement officials in New York are discussing security preparations in anticipation that Trump may be indicted in coming weeks. If it does occur, Trump would become the first former president to be indicted in U.S. history."""
- #print(len(tokenizer(example)["input_ids"]))
- #summary = model.predict(example)
- #print(summary)