Skip to content

Instantly share code, notes, and snippets.

@travishsu
Created May 12, 2022 09:03
Show Gist options
  • Save travishsu/33087a6165f9e2f475c7783e659629f1 to your computer and use it in GitHub Desktop.
Save travishsu/33087a6165f9e2f475c7783e659629f1 to your computer and use it in GitHub Desktop.
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Dependencies"
]
},
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"import os\n",
"import pandas as pd\n",
"import tqdm\n",
"import math\n",
"import sqlite3\n",
"\n",
"os.environ['CUDA_LAUNCH_BLOCKING'] = '1'\n",
"os.environ['TOKENIZERS_PARALLELISM'] = 'true'"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [],
"source": [
"tokenizer_folder = \"tokenizer\""
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [],
"source": [
"# def sqlite_to_df(db_path, db_name=\"patent\"):\n",
"# conn = sqlite3.connect(db_path)\n",
"# df = pd.read_sql(f\"SELECT * FROM {db_name}\", conn)\n",
"# conn.close()\n",
"# return df\n",
"\n",
"# df = sqlite_to_df(\"/home/alfos/workspace/darpa/darpa-topic-modeling/models/patent_large.db\")\n",
"\n",
"# df = df.assign(text_id=df.apply(lambda row: row.patent_number + '_' + row.section, axis=1))\n",
"\n",
"# patent_text = df.groupby(\"text_id\").text.transform(lambda txt: \" \".join(txt))\n",
"# df = df.assign(patent_text=patent_text)\n",
"# df = df.drop_duplicates(\"text_id\").reset_index(drop=True)\n",
"# df = df[['cpcs', 'title', 'patent_number', 'section', 'patent_text']]\n",
"\n",
"# train = df.sample(frac=0.8)\n",
"# test = df[~df.index.isin(train.index)]\n",
"\n",
"# train.to_csv(\"data/train.csv\", index=False)\n",
"# test.to_csv(\"data/test.csv\", index=False)"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Num Train Examples: 77174\n",
"Num Test Examples: 19294\n"
]
}
],
"source": [
"train = pd.read_csv(\"data/train.csv\")\n",
"test = pd.read_csv(\"data/test.csv\")\n",
"\n",
"print(f\"Num Train Examples: {len(train)}\")\n",
"print(f\"Num Test Examples: {len(test)}\")"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Build a Tokenizer\n",
"### Create the dataset to train a tokenizer"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [],
"source": [
"txt_files_dir = \"./text_split\"\n",
"!rm -rf {txt_files_dir}\n",
"!mkdir {txt_files_dir}"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [],
"source": [
"def column_to_files(column, prefix, txt_files_dir):\n",
" # The prefix is a unique ID to avoid to overwrite a text file\n",
" i = prefix\n",
" # For every value in the df, with just one column\n",
" for row in column.to_list():\n",
" # Create the filename using the prefix ID\n",
" file_name = os.path.join(txt_files_dir, str(i) + '.txt')\n",
"\n",
" try:\n",
" # Create the file and write the column text to it\n",
" f = open(file_name, \"wb\")\n",
" f.write(row.encode(\"utf-8\"))\n",
" f.close()\n",
" except Exception as e:\n",
" print(row, e)\n",
" i += 1\n",
" # Return the last prefix ID\n",
" return i"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"77174\n"
]
}
],
"source": [
"data = train['patent_text']\n",
"\n",
"# Set the ID to 0\n",
"prefix = 0\n",
"# Create a file for every patent text in train\n",
"prefix = column_to_files(data, prefix, txt_files_dir)\n",
"# Print the last ID\n",
"print(prefix)"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"96468\n"
]
}
],
"source": [
"data = test['patent_text']\n",
"\n",
"# Create a file for every patent text in test\n",
"prefix = column_to_files(data, prefix, txt_files_dir)\n",
"# Print the last ID\n",
"print(prefix)"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>cpcs</th>\n",
" <th>title</th>\n",
" <th>patent_number</th>\n",
" <th>section</th>\n",
" <th>patent_text</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>G06F 16/2365,G06F 16/128,G06F 16/24561</td>\n",
" <td>Methods, apparatuses, and systems for ingestin...</td>\n",
" <td>US11269856B2</td>\n",
" <td>background</td>\n",
" <td>The inventors have discovered limitations with...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>C12N 9/0042</td>\n",
" <td>Recombinant vector and method for producing re...</td>\n",
" <td>US11236309B2</td>\n",
" <td>abstract</td>\n",
" <td>A recombinant vector according to an embodimen...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>C23C 16/345,B01J 29/40,C23C 16/0254,C23C 16/36...</td>\n",
" <td>Processes for depositing silicon-containing fi...</td>\n",
" <td>US11268190B2</td>\n",
" <td>summary</td>\n",
" <td>Described herein are halidosilane compounds, p...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>F24F 7/10,E04B 1/7069,E04B 1/72,F24F 7/02,F24F...</td>\n",
" <td>Systems and methods for controlling air proper...</td>\n",
" <td>US11248814B2</td>\n",
" <td>abstract</td>\n",
" <td>A structure comprises at least one outer wall ...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>G06F 16/2379,G06F 16/221,G06F 16/2455</td>\n",
" <td>Scalable implementations of exact distinct cou...</td>\n",
" <td>US11263202B2</td>\n",
" <td>abstract</td>\n",
" <td>Scalable implementations of exact distinct cou...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>77169</th>\n",
" <td>B65D 19/0012,B65D 2519/00019,B65D 2519/00034,B...</td>\n",
" <td>Stackable pallet display</td>\n",
" <td>US11267609B2</td>\n",
" <td>background</td>\n",
" <td>The packaging industry is always striving to i...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>77170</th>\n",
" <td>A01J 25/02,A01J 25/115,A01J 25/15,A47J 27/004,...</td>\n",
" <td>Countertop cooking appliance</td>\n",
" <td>US11259497B2</td>\n",
" <td>abstract</td>\n",
" <td>A countertop cooking appliance is an apparatus...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>77171</th>\n",
" <td>H04B 7/0626,H04B 7/0617,H04B 7/0857,H04B 17/336</td>\n",
" <td>Coordinated beamforming of transmitting nodes ...</td>\n",
" <td>US11251850B1</td>\n",
" <td>background</td>\n",
" <td>Wireless mesh networks include a collection of...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>77172</th>\n",
" <td>G09G 5/14,G09G 2320/0247,G09G 2320/0673</td>\n",
" <td>Electronic device and method for driving displ...</td>\n",
" <td>US11238832B2</td>\n",
" <td>summary</td>\n",
" <td>In displaying a screen on a display in a recen...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>77173</th>\n",
" <td>G06Q 20/3227,G06Q 20/206,G06Q 30/0603,G06Q 30/...</td>\n",
" <td>Mobile cart reconciliation</td>\n",
" <td>US11244301B2</td>\n",
" <td>abstract</td>\n",
" <td>Disclosed herein is a method where a consumer ...</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>77174 rows × 5 columns</p>\n",
"</div>"
],
"text/plain": [
" cpcs \\\n",
"0 G06F 16/2365,G06F 16/128,G06F 16/24561 \n",
"1 C12N 9/0042 \n",
"2 C23C 16/345,B01J 29/40,C23C 16/0254,C23C 16/36... \n",
"3 F24F 7/10,E04B 1/7069,E04B 1/72,F24F 7/02,F24F... \n",
"4 G06F 16/2379,G06F 16/221,G06F 16/2455 \n",
"... ... \n",
"77169 B65D 19/0012,B65D 2519/00019,B65D 2519/00034,B... \n",
"77170 A01J 25/02,A01J 25/115,A01J 25/15,A47J 27/004,... \n",
"77171 H04B 7/0626,H04B 7/0617,H04B 7/0857,H04B 17/336 \n",
"77172 G09G 5/14,G09G 2320/0247,G09G 2320/0673 \n",
"77173 G06Q 20/3227,G06Q 20/206,G06Q 30/0603,G06Q 30/... \n",
"\n",
" title patent_number \\\n",
"0 Methods, apparatuses, and systems for ingestin... US11269856B2 \n",
"1 Recombinant vector and method for producing re... US11236309B2 \n",
"2 Processes for depositing silicon-containing fi... US11268190B2 \n",
"3 Systems and methods for controlling air proper... US11248814B2 \n",
"4 Scalable implementations of exact distinct cou... US11263202B2 \n",
"... ... ... \n",
"77169 Stackable pallet display US11267609B2 \n",
"77170 Countertop cooking appliance US11259497B2 \n",
"77171 Coordinated beamforming of transmitting nodes ... US11251850B1 \n",
"77172 Electronic device and method for driving displ... US11238832B2 \n",
"77173 Mobile cart reconciliation US11244301B2 \n",
"\n",
" section patent_text \n",
"0 background The inventors have discovered limitations with... \n",
"1 abstract A recombinant vector according to an embodimen... \n",
"2 summary Described herein are halidosilane compounds, p... \n",
"3 abstract A structure comprises at least one outer wall ... \n",
"4 abstract Scalable implementations of exact distinct cou... \n",
"... ... ... \n",
"77169 background The packaging industry is always striving to i... \n",
"77170 abstract A countertop cooking appliance is an apparatus... \n",
"77171 background Wireless mesh networks include a collection of... \n",
"77172 summary In displaying a screen on a display in a recen... \n",
"77173 abstract Disclosed herein is a method where a consumer ... \n",
"\n",
"[77174 rows x 5 columns]"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"train"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Train the tokenizer"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Requirement already satisfied: transformers in ./env/lib/python3.9/site-packages (4.18.0)\n",
"Requirement already satisfied: regex!=2019.12.17 in ./env/lib/python3.9/site-packages (from transformers) (2022.4.24)\n",
"Requirement already satisfied: tqdm>=4.27 in ./env/lib/python3.9/site-packages (from transformers) (4.64.0)\n",
"Requirement already satisfied: sacremoses in ./env/lib/python3.9/site-packages (from transformers) (0.0.53)\n",
"Requirement already satisfied: requests in ./env/lib/python3.9/site-packages (from transformers) (2.27.1)\n",
"Requirement already satisfied: pyyaml>=5.1 in ./env/lib/python3.9/site-packages (from transformers) (6.0)\n",
"Requirement already satisfied: numpy>=1.17 in ./env/lib/python3.9/site-packages (from transformers) (1.22.3)\n",
"Requirement already satisfied: tokenizers!=0.11.3,<0.13,>=0.11.1 in ./env/lib/python3.9/site-packages (from transformers) (0.12.1)\n",
"Requirement already satisfied: filelock in ./env/lib/python3.9/site-packages (from transformers) (3.6.0)\n",
"Requirement already satisfied: huggingface-hub<1.0,>=0.1.0 in ./env/lib/python3.9/site-packages (from transformers) (0.5.1)\n",
"Requirement already satisfied: packaging>=20.0 in ./env/lib/python3.9/site-packages (from transformers) (21.3)\n",
"Requirement already satisfied: typing-extensions>=3.7.4.3 in ./env/lib/python3.9/site-packages (from huggingface-hub<1.0,>=0.1.0->transformers) (4.2.0)\n",
"Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in ./env/lib/python3.9/site-packages (from packaging>=20.0->transformers) (3.0.9)\n",
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./env/lib/python3.9/site-packages (from requests->transformers) (1.26.9)\n",
"Requirement already satisfied: certifi>=2017.4.17 in ./env/lib/python3.9/site-packages (from requests->transformers) (2021.10.8)\n",
"Requirement already satisfied: charset-normalizer~=2.0.0 in ./env/lib/python3.9/site-packages (from requests->transformers) (2.0.12)\n",
"Requirement already satisfied: idna<4,>=2.5 in ./env/lib/python3.9/site-packages (from requests->transformers) (3.3)\n",
"Requirement already satisfied: six in ./env/lib/python3.9/site-packages (from sacremoses->transformers) (1.16.0)\n",
"Requirement already satisfied: click in ./env/lib/python3.9/site-packages (from sacremoses->transformers) (8.1.3)\n",
"Requirement already satisfied: joblib in ./env/lib/python3.9/site-packages (from sacremoses->transformers) (1.1.0)\n",
"Requirement already satisfied: datasets in ./env/lib/python3.9/site-packages (2.2.0)\n",
"Requirement already satisfied: dill in ./env/lib/python3.9/site-packages (from datasets) (0.3.4)\n",
"Requirement already satisfied: packaging in ./env/lib/python3.9/site-packages (from datasets) (21.3)\n",
"Requirement already satisfied: xxhash in ./env/lib/python3.9/site-packages (from datasets) (3.0.0)\n",
"Requirement already satisfied: responses<0.19 in ./env/lib/python3.9/site-packages (from datasets) (0.18.0)\n",
"Requirement already satisfied: numpy>=1.17 in ./env/lib/python3.9/site-packages (from datasets) (1.22.3)\n",
"Requirement already satisfied: pyarrow>=6.0.0 in ./env/lib/python3.9/site-packages (from datasets) (8.0.0)\n",
"Requirement already satisfied: fsspec[http]>=2021.05.0 in ./env/lib/python3.9/site-packages (from datasets) (2022.3.0)\n",
"Requirement already satisfied: huggingface-hub<1.0.0,>=0.1.0 in ./env/lib/python3.9/site-packages (from datasets) (0.5.1)\n",
"Requirement already satisfied: requests>=2.19.0 in ./env/lib/python3.9/site-packages (from datasets) (2.27.1)\n",
"Requirement already satisfied: pandas in ./env/lib/python3.9/site-packages (from datasets) (1.4.2)\n",
"Requirement already satisfied: aiohttp in ./env/lib/python3.9/site-packages (from datasets) (3.8.1)\n",
"Requirement already satisfied: tqdm>=4.62.1 in ./env/lib/python3.9/site-packages (from datasets) (4.64.0)\n",
"Requirement already satisfied: multiprocess in ./env/lib/python3.9/site-packages (from datasets) (0.70.12.2)\n",
"Requirement already satisfied: typing-extensions>=3.7.4.3 in ./env/lib/python3.9/site-packages (from huggingface-hub<1.0.0,>=0.1.0->datasets) (4.2.0)\n",
"Requirement already satisfied: pyyaml in ./env/lib/python3.9/site-packages (from huggingface-hub<1.0.0,>=0.1.0->datasets) (6.0)\n",
"Requirement already satisfied: filelock in ./env/lib/python3.9/site-packages (from huggingface-hub<1.0.0,>=0.1.0->datasets) (3.6.0)\n",
"Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in ./env/lib/python3.9/site-packages (from packaging->datasets) (3.0.9)\n",
"Requirement already satisfied: certifi>=2017.4.17 in ./env/lib/python3.9/site-packages (from requests>=2.19.0->datasets) (2021.10.8)\n",
"Requirement already satisfied: idna<4,>=2.5 in ./env/lib/python3.9/site-packages (from requests>=2.19.0->datasets) (3.3)\n",
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in ./env/lib/python3.9/site-packages (from requests>=2.19.0->datasets) (1.26.9)\n",
"Requirement already satisfied: charset-normalizer~=2.0.0 in ./env/lib/python3.9/site-packages (from requests>=2.19.0->datasets) (2.0.12)\n",
"Requirement already satisfied: attrs>=17.3.0 in ./env/lib/python3.9/site-packages (from aiohttp->datasets) (21.4.0)\n",
"Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in ./env/lib/python3.9/site-packages (from aiohttp->datasets) (4.0.2)\n",
"Requirement already satisfied: frozenlist>=1.1.1 in ./env/lib/python3.9/site-packages (from aiohttp->datasets) (1.3.0)\n",
"Requirement already satisfied: multidict<7.0,>=4.5 in ./env/lib/python3.9/site-packages (from aiohttp->datasets) (6.0.2)\n",
"Requirement already satisfied: yarl<2.0,>=1.0 in ./env/lib/python3.9/site-packages (from aiohttp->datasets) (1.7.2)\n",
"Requirement already satisfied: aiosignal>=1.1.2 in ./env/lib/python3.9/site-packages (from aiohttp->datasets) (1.2.0)\n",
"Requirement already satisfied: python-dateutil>=2.8.1 in ./env/lib/python3.9/site-packages (from pandas->datasets) (2.8.2)\n",
"Requirement already satisfied: pytz>=2020.1 in ./env/lib/python3.9/site-packages (from pandas->datasets) (2022.1)\n",
"Requirement already satisfied: six>=1.5 in ./env/lib/python3.9/site-packages (from python-dateutil>=2.8.1->pandas->datasets) (1.16.0)\n",
"Requirement already satisfied: torch in ./env/lib/python3.9/site-packages (1.11.0)\n",
"Requirement already satisfied: typing-extensions in ./env/lib/python3.9/site-packages (from torch) (4.2.0)\n"
]
}
],
"source": [
"!pip install transformers\n",
"!pip install datasets\n",
"!pip install torch"
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {},
"outputs": [],
"source": [
"# from pathlib import Path\n",
"\n",
"# from tokenizers import ByteLevelBPETokenizer\n",
"# from tokenizers.processors import BertProcessing\n",
"\n",
"import torch\n",
"from torch.utils.data.dataset import Dataset"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {},
"outputs": [],
"source": [
"# %%time\n",
"# paths = [str(x) for x in Path(\".\").glob(\"text_split/*.txt\")]\n",
"\n",
"# # Initializer a tokenizer\n",
"# tokenizer = ByteLevelBPETokenizer(lowercase=True)\n",
"\n",
"# # Customizer training\n",
"# tokenizer.train(\n",
"# files=paths,\n",
"# vocab_size=8192,\n",
"# min_frequency=2,\n",
"# show_progress=True,\n",
"# special_tokens=[\"<s>\", \"<pad>\", \"</s>\", \"<mask>\"],)"
]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {},
"outputs": [],
"source": [
"# # Save the Tokenizer to dist\n",
"# !rm -rf {tokenizer_folder}\n",
"# !mkdir {tokenizer_folder}\n",
"\n",
"# tokenizer.save_model(tokenizer_folder)"
]
},
{
"cell_type": "code",
"execution_count": 14,
"metadata": {},
"outputs": [],
"source": [
"# # Prepare the tokenizer\n",
"# tokenizer = ByteLevelBPETokenizer(\n",
"# os.path.abspath(os.path.join(tokenizer_folder, \"vocab.json\")),\n",
"# os.path.abspath(os.path.join(tokenizer_folder, \"merges.txt\"))\n",
"# )\n",
"# tokenizer.enable_truncation(max_length=512)"
]
},
{
"cell_type": "code",
"execution_count": 15,
"metadata": {},
"outputs": [],
"source": [
"# tokenizer.encode(train.patent_text.iloc[0]).tokens"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Train a language model from scratch"
]
},
{
"cell_type": "code",
"execution_count": 16,
"metadata": {},
"outputs": [],
"source": [
"TRAIN_BATCH_SIZE = 16\n",
"VALID_BATCH_SIZE = 8\n",
"TRAIN_EPOCHS = 15\n",
"LEARNING_RATE = 1e-4\n",
"WEIGHT_DECAY = 0.01\n",
"SEED = 42\n",
"MAX_LEN = 128\n",
"SUMMARY_LEN = 7"
]
},
{
"cell_type": "code",
"execution_count": 17,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Thu May 12 16:56:25 2022 \n",
"+-----------------------------------------------------------------------------+\n",
"| NVIDIA-SMI 465.19.01 Driver Version: 465.19.01 CUDA Version: 11.3 |\n",
"|-------------------------------+----------------------+----------------------+\n",
"| GPU Name Persistence-M| Bus-Id Disp.A | Volatile Uncorr. ECC |\n",
"| Fan Temp Perf Pwr:Usage/Cap| Memory-Usage | GPU-Util Compute M. |\n",
"| | | MIG M. |\n",
"|===============================+======================+======================|\n",
"| 0 NVIDIA GeForce ... Off | 00000000:01:00.0 Off | N/A |\n",
"| 0% 39C P8 7W / 198W | 42MiB / 8119MiB | 0% Default |\n",
"| | | N/A |\n",
"+-------------------------------+----------------------+----------------------+\n",
" \n",
"+-----------------------------------------------------------------------------+\n",
"| Processes: |\n",
"| GPU GI CI PID Type Process name GPU Memory |\n",
"| ID ID Usage |\n",
"|=============================================================================|\n",
"| 0 N/A N/A 1442 G /usr/lib/xorg/Xorg 39MiB |\n",
"+-----------------------------------------------------------------------------+\n"
]
}
],
"source": [
"# Check we have a GPU\n",
"!nvidia-smi"
]
},
{
"cell_type": "code",
"execution_count": 18,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"True"
]
},
"execution_count": 18,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Check that PyTorch sees it\n",
"import torch\n",
"torch.cuda.is_available()"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Define the model"
]
},
{
"cell_type": "code",
"execution_count": 19,
"metadata": {},
"outputs": [],
"source": [
"from transformers import RobertaConfig\n",
"\n",
"config = RobertaConfig(\n",
" vocab_size=8192,\n",
" max_position_embeddings=514,\n",
" num_attention_heads=12,\n",
" num_hidden_layers=6,\n",
" type_vocab_size=1,\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 20,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Num parameters: 49816064\n"
]
}
],
"source": [
"from transformers import RobertaForMaskedLM\n",
"\n",
"model = RobertaForMaskedLM(config=config)\n",
"print(f\"Num parameters: {model.num_parameters()}\")"
]
},
{
"cell_type": "code",
"execution_count": 21,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.\n"
]
}
],
"source": [
"from transformers import RobertaTokenizerFast\n",
"\n",
"# Create the tokenizer from a trained one\n",
"tokenizer = RobertaTokenizerFast.from_pretrained(tokenizer_folder, max_len=MAX_LEN)"
]
},
{
"cell_type": "code",
"execution_count": 22,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"PreTrainedTokenizerFast(name_or_path='tokenizer', vocab_size=8192, model_max_len=128, is_fast=True, padding_side='right', truncation_side='right', special_tokens={'bos_token': AddedToken(\"<s>\", rstrip=False, lstrip=False, single_word=False, normalized=True), 'eos_token': AddedToken(\"</s>\", rstrip=False, lstrip=False, single_word=False, normalized=True), 'unk_token': AddedToken(\"<unk>\", rstrip=False, lstrip=False, single_word=False, normalized=True), 'sep_token': AddedToken(\"</s>\", rstrip=False, lstrip=False, single_word=False, normalized=True), 'pad_token': AddedToken(\"<pad>\", rstrip=False, lstrip=False, single_word=False, normalized=True), 'cls_token': AddedToken(\"<s>\", rstrip=False, lstrip=False, single_word=False, normalized=True), 'mask_token': AddedToken(\"<mask>\", rstrip=False, lstrip=True, single_word=False, normalized=True)})"
]
},
"execution_count": 22,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"tokenizer"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Building the training Dataset"
]
},
{
"cell_type": "code",
"execution_count": 23,
"metadata": {},
"outputs": [],
"source": [
"class CustomDataset(Dataset):\n",
" def __init__(self, df, tokenizer):\n",
" self.examples = []\n",
" for example in df.values:\n",
" x = tokenizer.encode_plus(example, max_length=MAX_LEN, truncation=True, padding=True)\n",
" self.examples += [x.input_ids]\n",
"\n",
" def __len__(self):\n",
" return len(self.examples)\n",
"\n",
" def __getitem__(self, i):\n",
" return torch.tensor(self.examples[i])"
]
},
{
"cell_type": "code",
"execution_count": 24,
"metadata": {},
"outputs": [],
"source": [
"df = pd.concat([train, test])"
]
},
{
"cell_type": "code",
"execution_count": 25,
"metadata": {},
"outputs": [],
"source": [
"train_dataset = CustomDataset(train.patent_text, tokenizer)\n",
"eval_dataset = CustomDataset(test.patent_text, tokenizer)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Define the Data Collator for masking our language"
]
},
{
"cell_type": "code",
"execution_count": 26,
"metadata": {},
"outputs": [],
"source": [
"from transformers import DataCollatorForLanguageModeling\n",
"\n",
"# Define the Data Collator\n",
"data_collator = DataCollatorForLanguageModeling(\n",
" tokenizer=tokenizer, mlm=True, mlm_probability=0.15,\n",
")"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"### Initializer and train our Trainer"
]
},
{
"cell_type": "code",
"execution_count": 27,
"metadata": {},
"outputs": [],
"source": [
"model_folder = \"RoBERT\"\n",
"\n",
"!rm -rf {model_folder}\n",
"!mkdir {model_folder}"
]
},
{
"cell_type": "code",
"execution_count": 28,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"RoBERT\n"
]
}
],
"source": [
"from transformers import Trainer, TrainingArguments\n",
"\n",
"print(model_folder)\n",
"# Define the training arguments\n",
"training_args = TrainingArguments(\n",
" output_dir=model_folder,\n",
" overwrite_output_dir=True,\n",
" evaluation_strategy=\"epoch\",\n",
" num_train_epochs=TRAIN_EPOCHS,\n",
" learning_rate=LEARNING_RATE,\n",
" weight_decay=WEIGHT_DECAY,\n",
" per_device_train_batch_size=TRAIN_BATCH_SIZE,\n",
" per_device_eval_batch_size=VALID_BATCH_SIZE,\n",
" save_steps=8192,\n",
" #eval_steps=4096,\n",
" save_total_limit=2,\n",
")\n",
"# Create the Trainer for out model\n",
"trainer = Trainer(\n",
" model=model,\n",
" args=training_args,\n",
" data_collator=data_collator,\n",
" train_dataset=train_dataset,\n",
" eval_dataset=eval_dataset,\n",
" #prediction_loss_only=True,\n",
")"
]
},
{
"cell_type": "code",
"execution_count": 29,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/optimization.py:306: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
" warnings.warn(\n",
"***** Running training *****\n",
" Num examples = 77174\n",
" Num Epochs = 15\n",
" Instantaneous batch size per device = 16\n",
" Total train batch size (w. parallel, distributed & accumulation) = 16\n",
" Gradient Accumulation steps = 1\n",
" Total optimization steps = 72360\n"
]
},
{
"data": {
"application/vnd.jupyter.widget-view+json": {
"model_id": "aec8c68996894fa99e858009e1407589",
"version_major": 2,
"version_minor": 0
},
"text/plain": [
" 0%| | 0/72360 [00:00<?, ?it/s]"
]
},
"metadata": {},
"output_type": "display_data"
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"{'loss': 6.5111, 'learning_rate': 9.930901050304035e-05, 'epoch': 0.1}\n"
]
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [0,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [1,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [2,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [3,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [4,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [5,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [6,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [7,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [8,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [9,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [10,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [11,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [12,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [13,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [14,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [15,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [16,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [17,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [18,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [19,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [20,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [21,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [22,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [23,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [24,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [25,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [26,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [27,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [28,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [29,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [30,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [31,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [96,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [97,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [98,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [99,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [100,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [101,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [102,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [103,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [104,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [105,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [106,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [107,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [108,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [109,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [110,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [111,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [112,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [113,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [114,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [115,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [116,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [117,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [118,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [119,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [120,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [121,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [122,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [123,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [124,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [125,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [126,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [127,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [32,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [33,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [34,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [35,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [36,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [37,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [38,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [39,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [40,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [41,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [42,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [43,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [44,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [45,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [46,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [47,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [48,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [49,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [50,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [51,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [52,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [53,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [54,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [55,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [56,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [57,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [58,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [59,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [60,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [61,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [62,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [63,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [64,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [65,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [66,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [67,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [68,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [69,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [70,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [71,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [72,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [73,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [74,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [75,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [76,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [77,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [78,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [79,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [80,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [81,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [82,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [83,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [84,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [85,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [86,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [87,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [88,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [89,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [90,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [91,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [92,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [93,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [94,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [95,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [64,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [65,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [66,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [67,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [68,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [69,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [70,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [71,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [72,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [73,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [74,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [75,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [76,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [77,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [78,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [79,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [80,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [81,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [82,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [83,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [84,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [85,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [86,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [87,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [88,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [89,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [90,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [91,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [92,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [93,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [94,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [23,0,0], thread: [95,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [32,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [33,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [34,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [35,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [36,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [37,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [38,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [39,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [40,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [41,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [42,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [43,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [44,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [45,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [46,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [47,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [48,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [49,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [50,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [51,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [52,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [53,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [54,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [55,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [56,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [57,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [58,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [59,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [60,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [61,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [62,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [63,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [32,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [33,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [34,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [35,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [36,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [37,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [38,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [39,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [40,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [41,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [42,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [43,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [44,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [45,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [46,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [47,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [48,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [49,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [50,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [51,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [52,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [53,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [54,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [55,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [56,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [57,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [58,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [59,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [60,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [61,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [62,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [63,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [0,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [1,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [2,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [3,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [4,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [5,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [6,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [7,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [8,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [9,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [10,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [11,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [12,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [13,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [14,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [15,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [16,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [17,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [18,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [19,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [20,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [21,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [22,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [23,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [24,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [25,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [26,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [27,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [28,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [29,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [30,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [24,0,0], thread: [31,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [32,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [33,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [34,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [35,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [36,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [37,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [38,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [39,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [40,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [41,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [42,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [43,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [44,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [45,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [46,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [47,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [48,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [49,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [50,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [51,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [52,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [53,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [54,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [55,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [56,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [57,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [58,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [59,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [60,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [61,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [62,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [63,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [96,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [97,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [98,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [99,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [100,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [101,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [102,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [103,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [104,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [105,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [106,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [107,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [108,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [109,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [110,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [111,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [112,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [113,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [114,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [115,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [116,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [117,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [118,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [119,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [120,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [121,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [122,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [123,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [124,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [125,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [126,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [127,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [96,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [97,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [98,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [99,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [100,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [101,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [102,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [103,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [104,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [105,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [106,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [107,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [108,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [109,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [110,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [111,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [112,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [113,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [114,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [115,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [116,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [117,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [118,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [119,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [120,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [121,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [122,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [123,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [124,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [125,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [126,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [20,0,0], thread: [127,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [96,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [97,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [98,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [99,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [100,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [101,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [102,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [103,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [104,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [105,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [106,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [107,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [108,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [109,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [110,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [111,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [112,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [113,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [114,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [115,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [116,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [117,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [118,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [119,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [120,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [121,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [122,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [123,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [124,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [125,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [126,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [127,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [64,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [65,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [66,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [67,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [68,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [69,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [70,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [71,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [72,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [73,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [74,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [75,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [76,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [77,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [78,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [79,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [80,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [81,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [82,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [83,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [84,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [85,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [86,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [87,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [88,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [89,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [90,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [91,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [92,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [93,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [94,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [22,0,0], thread: [95,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [64,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [65,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [66,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [67,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [68,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [69,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [70,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [71,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [72,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [73,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [74,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [75,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [76,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [77,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [78,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [79,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [80,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [81,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [82,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [83,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [84,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [85,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [86,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [87,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [88,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [89,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [90,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [91,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [92,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [93,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [94,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [95,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [0,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [1,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [2,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [3,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [4,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [5,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [6,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [7,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [8,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [9,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [10,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [11,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [12,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [13,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [14,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [15,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [16,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [17,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [18,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [19,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [20,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [21,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [22,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [23,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [24,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [25,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [26,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [27,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [28,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [29,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [30,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [31,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [0,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [1,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [2,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [3,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [4,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [5,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [6,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [7,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [8,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [9,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [10,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [11,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [12,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [13,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [14,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [15,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [16,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [17,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [18,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [19,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [20,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [21,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [22,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [23,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [24,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [25,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [26,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [27,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [28,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [29,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [30,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [21,0,0], thread: [31,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [64,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [65,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [66,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [67,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [68,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [69,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [70,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [71,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [72,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [73,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [74,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [75,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [76,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [77,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [78,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [79,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [80,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [81,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [82,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [83,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [84,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [85,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [86,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [87,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [88,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [89,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [90,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [91,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [92,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [93,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [94,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [95,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [32,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [33,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [34,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [35,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [36,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [37,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [38,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [39,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [40,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [41,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [42,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [43,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [44,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [45,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [46,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [47,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [48,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [49,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [50,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [51,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [52,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [53,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [54,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [55,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [56,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [57,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [58,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [59,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [60,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [61,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [62,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n",
"../aten/src/ATen/native/cuda/Indexing.cu:703: indexSelectLargeIndex: block: [25,0,0], thread: [63,0,0] Assertion `srcIndex < srcSelectDimSize` failed.\n"
]
},
{
"ename": "RuntimeError",
"evalue": "CUDA error: device-side assert triggered",
"output_type": "error",
"traceback": [
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
"\u001b[0;31mRuntimeError\u001b[0m Traceback (most recent call last)",
"\u001b[1;32m/home/alfos/workspace/darpa/train_huggingface_from_scratch/notebook.ipynb Cell 37'\u001b[0m in \u001b[0;36m<cell line: 2>\u001b[0;34m()\u001b[0m\n\u001b[1;32m <a href='vscode-notebook-cell:/home/alfos/workspace/darpa/train_huggingface_from_scratch/notebook.ipynb#ch0000036?line=0'>1</a>\u001b[0m \u001b[39m# Train the model\u001b[39;00m\n\u001b[0;32m----> <a href='vscode-notebook-cell:/home/alfos/workspace/darpa/train_huggingface_from_scratch/notebook.ipynb#ch0000036?line=1'>2</a>\u001b[0m trainer\u001b[39m.\u001b[39;49mtrain()\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py:1422\u001b[0m, in \u001b[0;36mTrainer.train\u001b[0;34m(self, resume_from_checkpoint, trial, ignore_keys_for_eval, **kwargs)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=1419'>1420</a>\u001b[0m tr_loss_step \u001b[39m=\u001b[39m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mtraining_step(model, inputs)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=1420'>1421</a>\u001b[0m \u001b[39melse\u001b[39;00m:\n\u001b[0;32m-> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=1421'>1422</a>\u001b[0m tr_loss_step \u001b[39m=\u001b[39m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mtraining_step(model, inputs)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=1423'>1424</a>\u001b[0m \u001b[39mif\u001b[39;00m (\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=1424'>1425</a>\u001b[0m args\u001b[39m.\u001b[39mlogging_nan_inf_filter\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=1425'>1426</a>\u001b[0m \u001b[39mand\u001b[39;00m \u001b[39mnot\u001b[39;00m is_torch_tpu_available()\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=1426'>1427</a>\u001b[0m \u001b[39mand\u001b[39;00m (torch\u001b[39m.\u001b[39misnan(tr_loss_step) \u001b[39mor\u001b[39;00m torch\u001b[39m.\u001b[39misinf(tr_loss_step))\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=1427'>1428</a>\u001b[0m ):\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=1428'>1429</a>\u001b[0m \u001b[39m# if loss is nan or inf simply add the average of previous logged losses\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=1429'>1430</a>\u001b[0m tr_loss \u001b[39m+\u001b[39m\u001b[39m=\u001b[39m tr_loss \u001b[39m/\u001b[39m (\u001b[39m1\u001b[39m \u001b[39m+\u001b[39m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mstate\u001b[39m.\u001b[39mglobal_step \u001b[39m-\u001b[39m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_globalstep_last_logged)\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py:2011\u001b[0m, in \u001b[0;36mTrainer.training_step\u001b[0;34m(self, model, inputs)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2007'>2008</a>\u001b[0m \u001b[39mreturn\u001b[39;00m loss_mb\u001b[39m.\u001b[39mreduce_mean()\u001b[39m.\u001b[39mdetach()\u001b[39m.\u001b[39mto(\u001b[39mself\u001b[39m\u001b[39m.\u001b[39margs\u001b[39m.\u001b[39mdevice)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2009'>2010</a>\u001b[0m \u001b[39mwith\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mautocast_smart_context_manager():\n\u001b[0;32m-> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2010'>2011</a>\u001b[0m loss \u001b[39m=\u001b[39m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mcompute_loss(model, inputs)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2012'>2013</a>\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39margs\u001b[39m.\u001b[39mn_gpu \u001b[39m>\u001b[39m \u001b[39m1\u001b[39m:\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2013'>2014</a>\u001b[0m loss \u001b[39m=\u001b[39m loss\u001b[39m.\u001b[39mmean() \u001b[39m# mean() to average on multi-gpu parallel training\u001b[39;00m\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py:2043\u001b[0m, in \u001b[0;36mTrainer.compute_loss\u001b[0;34m(self, model, inputs, return_outputs)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2040'>2041</a>\u001b[0m \u001b[39melse\u001b[39;00m:\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2041'>2042</a>\u001b[0m labels \u001b[39m=\u001b[39m \u001b[39mNone\u001b[39;00m\n\u001b[0;32m-> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2042'>2043</a>\u001b[0m outputs \u001b[39m=\u001b[39m model(\u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49minputs)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2043'>2044</a>\u001b[0m \u001b[39m# Save past state if it exists\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2044'>2045</a>\u001b[0m \u001b[39m# TODO: this needs to be fixed and made cleaner later.\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/trainer.py?line=2045'>2046</a>\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39margs\u001b[39m.\u001b[39mpast_index \u001b[39m>\u001b[39m\u001b[39m=\u001b[39m \u001b[39m0\u001b[39m:\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py:1110\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *input, **kwargs)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1105'>1106</a>\u001b[0m \u001b[39m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1106'>1107</a>\u001b[0m \u001b[39m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1107'>1108</a>\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39mnot\u001b[39;00m (\u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_backward_hooks \u001b[39mor\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_forward_hooks \u001b[39mor\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_forward_pre_hooks \u001b[39mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1108'>1109</a>\u001b[0m \u001b[39mor\u001b[39;00m _global_forward_hooks \u001b[39mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1109'>1110</a>\u001b[0m \u001b[39mreturn\u001b[39;00m forward_call(\u001b[39m*\u001b[39;49m\u001b[39minput\u001b[39;49m, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49mkwargs)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1110'>1111</a>\u001b[0m \u001b[39m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1111'>1112</a>\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[39m=\u001b[39m [], []\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py:1098\u001b[0m, in \u001b[0;36mRobertaForMaskedLM.forward\u001b[0;34m(self, input_ids, attention_mask, token_type_ids, position_ids, head_mask, inputs_embeds, encoder_hidden_states, encoder_attention_mask, labels, output_attentions, output_hidden_states, return_dict)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1087'>1088</a>\u001b[0m \u001b[39mr\u001b[39m\u001b[39m\"\"\"\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1088'>1089</a>\u001b[0m \u001b[39mlabels (`torch.LongTensor` of shape `(batch_size, sequence_length)`, *optional*):\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1089'>1090</a>\u001b[0m \u001b[39m Labels for computing the masked language modeling loss. Indices should be in `[-100, 0, ...,\u001b[39;00m\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1093'>1094</a>\u001b[0m \u001b[39m Used to hide legacy arguments that have been deprecated.\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1094'>1095</a>\u001b[0m \u001b[39m\"\"\"\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1095'>1096</a>\u001b[0m return_dict \u001b[39m=\u001b[39m return_dict \u001b[39mif\u001b[39;00m return_dict \u001b[39mis\u001b[39;00m \u001b[39mnot\u001b[39;00m \u001b[39mNone\u001b[39;00m \u001b[39melse\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mconfig\u001b[39m.\u001b[39muse_return_dict\n\u001b[0;32m-> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1097'>1098</a>\u001b[0m outputs \u001b[39m=\u001b[39m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mroberta(\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1098'>1099</a>\u001b[0m input_ids,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1099'>1100</a>\u001b[0m attention_mask\u001b[39m=\u001b[39;49mattention_mask,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1100'>1101</a>\u001b[0m token_type_ids\u001b[39m=\u001b[39;49mtoken_type_ids,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1101'>1102</a>\u001b[0m position_ids\u001b[39m=\u001b[39;49mposition_ids,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1102'>1103</a>\u001b[0m head_mask\u001b[39m=\u001b[39;49mhead_mask,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1103'>1104</a>\u001b[0m inputs_embeds\u001b[39m=\u001b[39;49minputs_embeds,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1104'>1105</a>\u001b[0m encoder_hidden_states\u001b[39m=\u001b[39;49mencoder_hidden_states,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1105'>1106</a>\u001b[0m encoder_attention_mask\u001b[39m=\u001b[39;49mencoder_attention_mask,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1106'>1107</a>\u001b[0m output_attentions\u001b[39m=\u001b[39;49moutput_attentions,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1107'>1108</a>\u001b[0m output_hidden_states\u001b[39m=\u001b[39;49moutput_hidden_states,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1108'>1109</a>\u001b[0m return_dict\u001b[39m=\u001b[39;49mreturn_dict,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1109'>1110</a>\u001b[0m )\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1110'>1111</a>\u001b[0m sequence_output \u001b[39m=\u001b[39m outputs[\u001b[39m0\u001b[39m]\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=1111'>1112</a>\u001b[0m prediction_scores \u001b[39m=\u001b[39m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mlm_head(sequence_output)\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py:1110\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *input, **kwargs)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1105'>1106</a>\u001b[0m \u001b[39m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1106'>1107</a>\u001b[0m \u001b[39m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1107'>1108</a>\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39mnot\u001b[39;00m (\u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_backward_hooks \u001b[39mor\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_forward_hooks \u001b[39mor\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_forward_pre_hooks \u001b[39mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1108'>1109</a>\u001b[0m \u001b[39mor\u001b[39;00m _global_forward_hooks \u001b[39mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1109'>1110</a>\u001b[0m \u001b[39mreturn\u001b[39;00m forward_call(\u001b[39m*\u001b[39;49m\u001b[39minput\u001b[39;49m, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49mkwargs)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1110'>1111</a>\u001b[0m \u001b[39m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1111'>1112</a>\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[39m=\u001b[39m [], []\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py:844\u001b[0m, in \u001b[0;36mRobertaModel.forward\u001b[0;34m(self, input_ids, attention_mask, token_type_ids, position_ids, head_mask, inputs_embeds, encoder_hidden_states, encoder_attention_mask, past_key_values, use_cache, output_attentions, output_hidden_states, return_dict)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=836'>837</a>\u001b[0m \u001b[39m# Prepare head mask if needed\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=837'>838</a>\u001b[0m \u001b[39m# 1.0 in head_mask indicate we keep the head\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=838'>839</a>\u001b[0m \u001b[39m# attention_probs has shape bsz x n_heads x N x N\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=839'>840</a>\u001b[0m \u001b[39m# input head_mask has shape [num_heads] or [num_hidden_layers x num_heads]\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=840'>841</a>\u001b[0m \u001b[39m# and head_mask is converted to shape [num_hidden_layers x batch x num_heads x seq_length x seq_length]\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=841'>842</a>\u001b[0m head_mask \u001b[39m=\u001b[39m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mget_head_mask(head_mask, \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mconfig\u001b[39m.\u001b[39mnum_hidden_layers)\n\u001b[0;32m--> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=843'>844</a>\u001b[0m embedding_output \u001b[39m=\u001b[39m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49membeddings(\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=844'>845</a>\u001b[0m input_ids\u001b[39m=\u001b[39;49minput_ids,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=845'>846</a>\u001b[0m position_ids\u001b[39m=\u001b[39;49mposition_ids,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=846'>847</a>\u001b[0m token_type_ids\u001b[39m=\u001b[39;49mtoken_type_ids,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=847'>848</a>\u001b[0m inputs_embeds\u001b[39m=\u001b[39;49minputs_embeds,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=848'>849</a>\u001b[0m past_key_values_length\u001b[39m=\u001b[39;49mpast_key_values_length,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=849'>850</a>\u001b[0m )\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=850'>851</a>\u001b[0m encoder_outputs \u001b[39m=\u001b[39m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mencoder(\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=851'>852</a>\u001b[0m embedding_output,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=852'>853</a>\u001b[0m attention_mask\u001b[39m=\u001b[39mextended_attention_mask,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=860'>861</a>\u001b[0m return_dict\u001b[39m=\u001b[39mreturn_dict,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=861'>862</a>\u001b[0m )\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=862'>863</a>\u001b[0m sequence_output \u001b[39m=\u001b[39m encoder_outputs[\u001b[39m0\u001b[39m]\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py:1110\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *input, **kwargs)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1105'>1106</a>\u001b[0m \u001b[39m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1106'>1107</a>\u001b[0m \u001b[39m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1107'>1108</a>\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39mnot\u001b[39;00m (\u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_backward_hooks \u001b[39mor\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_forward_hooks \u001b[39mor\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_forward_pre_hooks \u001b[39mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1108'>1109</a>\u001b[0m \u001b[39mor\u001b[39;00m _global_forward_hooks \u001b[39mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1109'>1110</a>\u001b[0m \u001b[39mreturn\u001b[39;00m forward_call(\u001b[39m*\u001b[39;49m\u001b[39minput\u001b[39;49m, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49mkwargs)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1110'>1111</a>\u001b[0m \u001b[39m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1111'>1112</a>\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[39m=\u001b[39m [], []\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py:132\u001b[0m, in \u001b[0;36mRobertaEmbeddings.forward\u001b[0;34m(self, input_ids, token_type_ids, position_ids, inputs_embeds, past_key_values_length)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=128'>129</a>\u001b[0m token_type_ids \u001b[39m=\u001b[39m torch\u001b[39m.\u001b[39mzeros(input_shape, dtype\u001b[39m=\u001b[39mtorch\u001b[39m.\u001b[39mlong, device\u001b[39m=\u001b[39m\u001b[39mself\u001b[39m\u001b[39m.\u001b[39mposition_ids\u001b[39m.\u001b[39mdevice)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=130'>131</a>\u001b[0m \u001b[39mif\u001b[39;00m inputs_embeds \u001b[39mis\u001b[39;00m \u001b[39mNone\u001b[39;00m:\n\u001b[0;32m--> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=131'>132</a>\u001b[0m inputs_embeds \u001b[39m=\u001b[39m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mword_embeddings(input_ids)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=132'>133</a>\u001b[0m token_type_embeddings \u001b[39m=\u001b[39m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mtoken_type_embeddings(token_type_ids)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/transformers/models/roberta/modeling_roberta.py?line=134'>135</a>\u001b[0m embeddings \u001b[39m=\u001b[39m inputs_embeds \u001b[39m+\u001b[39m token_type_embeddings\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py:1110\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *input, **kwargs)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1105'>1106</a>\u001b[0m \u001b[39m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1106'>1107</a>\u001b[0m \u001b[39m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1107'>1108</a>\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39mnot\u001b[39;00m (\u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_backward_hooks \u001b[39mor\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_forward_hooks \u001b[39mor\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_forward_pre_hooks \u001b[39mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1108'>1109</a>\u001b[0m \u001b[39mor\u001b[39;00m _global_forward_hooks \u001b[39mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1109'>1110</a>\u001b[0m \u001b[39mreturn\u001b[39;00m forward_call(\u001b[39m*\u001b[39;49m\u001b[39minput\u001b[39;49m, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49mkwargs)\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1110'>1111</a>\u001b[0m \u001b[39m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/module.py?line=1111'>1112</a>\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[39m=\u001b[39m [], []\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/sparse.py:158\u001b[0m, in \u001b[0;36mEmbedding.forward\u001b[0;34m(self, input)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/sparse.py?line=156'>157</a>\u001b[0m \u001b[39mdef\u001b[39;00m \u001b[39mforward\u001b[39m(\u001b[39mself\u001b[39m, \u001b[39minput\u001b[39m: Tensor) \u001b[39m-\u001b[39m\u001b[39m>\u001b[39m Tensor:\n\u001b[0;32m--> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/sparse.py?line=157'>158</a>\u001b[0m \u001b[39mreturn\u001b[39;00m F\u001b[39m.\u001b[39;49membedding(\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/sparse.py?line=158'>159</a>\u001b[0m \u001b[39minput\u001b[39;49m, \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mweight, \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mpadding_idx, \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mmax_norm,\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/modules/sparse.py?line=159'>160</a>\u001b[0m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mnorm_type, \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mscale_grad_by_freq, \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49msparse)\n",
"File \u001b[0;32m~/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/functional.py:2183\u001b[0m, in \u001b[0;36membedding\u001b[0;34m(input, weight, padding_idx, max_norm, norm_type, scale_grad_by_freq, sparse)\u001b[0m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/functional.py?line=2176'>2177</a>\u001b[0m \u001b[39m# Note [embedding_renorm set_grad_enabled]\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/functional.py?line=2177'>2178</a>\u001b[0m \u001b[39m# XXX: equivalent to\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/functional.py?line=2178'>2179</a>\u001b[0m \u001b[39m# with torch.no_grad():\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/functional.py?line=2179'>2180</a>\u001b[0m \u001b[39m# torch.embedding_renorm_\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/functional.py?line=2180'>2181</a>\u001b[0m \u001b[39m# remove once script supports set_grad_enabled\u001b[39;00m\n\u001b[1;32m <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/functional.py?line=2181'>2182</a>\u001b[0m _no_grad_embedding_renorm_(weight, \u001b[39minput\u001b[39m, max_norm, norm_type)\n\u001b[0;32m-> <a href='file:///home/alfos/workspace/darpa/train_huggingface_from_scratch/env/lib/python3.9/site-packages/torch/nn/functional.py?line=2182'>2183</a>\u001b[0m \u001b[39mreturn\u001b[39;00m torch\u001b[39m.\u001b[39;49membedding(weight, \u001b[39minput\u001b[39;49m, padding_idx, scale_grad_by_freq, sparse)\n",
"\u001b[0;31mRuntimeError\u001b[0m: CUDA error: device-side assert triggered"
]
}
],
"source": [
"# Train the model\n",
"trainer.train()"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"interpreter": {
"hash": "6264f85c0b37a06e4c227b113684058583ab955329524df471d3ea8b0cce5507"
},
"kernelspec": {
"display_name": "Python 3.9.7 ('env': venv)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.7"
},
"orig_nbformat": 4
},
"nbformat": 4,
"nbformat_minor": 2
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment