Created October 22, 2020 15:09
# Benchmarking inference performance with and without data loaders
Run this notebook on a CPU/GPU runtime and measure differences in inference execution times.
!pip install transformers --quiet
"from transformers import BertTokenizer, BertForSequenceClassification\n",
# Run on the GPU when PyTorch reports CUDA as available; otherwise use the CPU.
device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')
# Bare expression: presumably the last line of a notebook cell, so the chosen
# device is echoed as the cell output.
device
"tokenizer = BertTokenizer.from_pretrained('textattack/bert-base-uncased-CoLA', truncation=True)\n",
"import spacy\n",
"text = \"\"\"\n",
# Collect the text of every sentence that `nlp` (presumably the spaCy pipeline
# loaded earlier in the notebook) finds in `text`, then repeat the list once so
# the benchmark sees each sentence twice.
sents = [span.text for span in nlp(text).sents] * 2
"### With DataLoader\n",
"encoded_data_val = tokenizer.batch_encode_plus(\n",
"input_ids_val = encoded_data_val['input_ids']\n",
"all_logits = np.empty([0,2])\n",
"### No dataloaders\n",
"all_logits2 = np.empty([0,2])\n",
"#check that results are practically identical in the two methods\n",
