0% found this document useful (0 votes)

129 views · 5 pages

Transformer - Ipynb - Colab

Uploaded by

anishpujari25

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

129 views · 5 pages

Transformer - Ipynb - Colab

Uploaded by

anishpujari25

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 5

transformer.ipynb - Colab 07/10/24, 2:22 PM

Text Prediction with Pre-trained Transformer Models

import torch
import string

from transformers import BertTokenizer, BertForMaskedLM

from transformers import XLNetTokenizer, XLNetLMHeadModel
from transformers import XLMRobertaTokenizer, XLMRobertaForMaskedLM
from transformers import BartTokenizer, BartForConditionalGeneration
from transformers import ElectraTokenizer, ElectraForMaskedLM
from transformers import RobertaTokenizer, RobertaForMaskedLM

# Load tokenizers and models

# Every tokenizer/model pair is loaded by checkpoint name via from_pretrained().
# Each model is put in evaluation mode with .eval() because this notebook only
# runs inference.
# NOTE(review): the BART and ELECTRA lines were cut off in the extracted
# listing; their tails were restored to follow the same pattern as the other
# models -- confirm against the original notebook.

bert_tokenizer = BertTokenizer.from_pretrained('bert-base-uncased')
bert_model = BertForMaskedLM.from_pretrained('bert-base-uncased').eval()

xlnet_tokenizer = XLNetTokenizer.from_pretrained('xlnet-base-cased')
xlnet_model = XLNetLMHeadModel.from_pretrained('xlnet-base-cased').eval()

xlmroberta_tokenizer = XLMRobertaTokenizer.from_pretrained('xlm-roberta-base')
xlmroberta_model = XLMRobertaForMaskedLM.from_pretrained('xlm-roberta-base').eval()

bart_tokenizer = BartTokenizer.from_pretrained('facebook/bart-large')
bart_model = BartForConditionalGeneration.from_pretrained('facebook/bart-large').eval()

electra_tokenizer = ElectraTokenizer.from_pretrained('google/electra-small-generator')
electra_model = ElectraForMaskedLM.from_pretrained('google/electra-small-generator').eval()

roberta_tokenizer = RobertaTokenizer.from_pretrained('roberta-base')
roberta_model = RobertaForMaskedLM.from_pretrained('roberta-base').eval()

# Number of highest-scoring vocabulary entries taken from each model's output
# at the masked position, before decode() filters them down to `top_clean`.
top_k = 10

def decode(tokenizer, pred_idx, top_clean):
    """Convert predicted vocabulary ids into a newline-separated word list.

    Args:
        tokenizer: Object exposing ``decode(ids, skip_special_tokens=...)``
            that returns the text for a list of token ids.
        pred_idx: Iterable of candidate token ids, in the order they should
            be reported.
        top_clean: Maximum number of cleaned tokens to keep.

    Returns:
        The first ``top_clean`` surviving tokens joined by newlines. Tokens
        that decode to an empty string, to ``'[PAD]'``, or to nothing but
        ASCII punctuation are dropped; a ``'##'`` word-piece marker is
        removed from the tokens that remain.
    """
    # Compare character by character. A substring test against one long
    # "punctuation + [PAD]" string would wrongly reject real tokens such as
    # "P", "A", "D" or "PAD" and would let runs like "!!!" through.
    punctuation = set(string.punctuation)
    tokens = []
    for w in pred_idx:
        token = tokenizer.decode([w], skip_special_tokens=True).strip()
        if not token or token == '[PAD]':
            continue
        if all(ch in punctuation for ch in token):
            continue
        tokens.append(token.replace('##', ''))
    return '\n'.join(tokens[:top_clean])

def encode(tokenizer, text_sentence, add_special_tokens=True):
    """Tokenize a sentence containing ``<mask>`` and locate the mask position.

    Args:
        tokenizer: Object exposing ``mask_token``, ``mask_token_id`` and
            ``encode(text, add_special_tokens=...)``.
        text_sentence: Input text in which ``<mask>`` marks the word to
            predict.
        add_special_tokens: Forwarded unchanged to ``tokenizer.encode``.

    Returns:
        A tuple ``(input_ids, mask_idx)``: ``input_ids`` is a tensor built
        from a one-element list of the encoded ids (so it has a leading
        dimension of 1), and ``mask_idx`` is the column of the first
        occurrence of ``tokenizer.mask_token_id`` in it.

    Raises:
        IndexError: If the encoded text contains no mask token (this includes
            empty input).
    """
    text_sentence = text_sentence.replace('<mask>', tokenizer.mask_token)

    # When the mask is the final word, add a trailing period.
    # NOTE(review): presumably so the models predict a word rather than
    # sentence-final punctuation -- confirm intent.
    words = text_sentence.split()
    if words and words[-1] == tokenizer.mask_token:
        text_sentence += ' .'

    input_ids = torch.tensor(
        [tokenizer.encode(text_sentence, add_special_tokens=add_special_tokens)]
    )

    # torch.where on the 2-D comparison yields (row_indices, col_indices);
    # the columns are the token positions.
    mask_positions = torch.where(input_ids == tokenizer.mask_token_id)[1].tolist()
    if not mask_positions:
        # Same exception type the bare `[0]` lookup raised, with a usable message.
        raise IndexError(
            "no mask token found in input; mark the word to predict with '<mask>'"
        )
    return input_ids, mask_positions[0]

def _masked_lm_predictions(tokenizer, model, text_sentence, top_clean):
    """Return cleaned candidates for the mask using a model called as model(input_ids)."""
    input_ids, mask_idx = encode(tokenizer, text_sentence)
    with torch.no_grad():
        predict = model(input_ids)[0]
    # Take the `top_k` highest-scoring vocabulary ids at the masked position.
    candidates = predict[0, mask_idx, :].topk(top_k).indices.tolist()
    return decode(tokenizer, candidates, top_clean)


def _xlnet_predictions(text_sentence, top_clean):
    """Return cleaned candidates for the mask from XLNet via perm_mask/target_mapping."""
    # XLNet input is encoded without special tokens.
    input_ids, mask_idx = encode(xlnet_tokenizer, text_sentence, False)
    seq_len = input_ids.shape[1]

    # Mark the masked column for every row of the permutation mask.
    # NOTE(review): per the XLNet model docs this should hide the masked token
    # from all positions -- confirm.
    perm_mask = torch.zeros((1, seq_len, seq_len), dtype=torch.float)
    perm_mask[:, :, mask_idx] = 1.0

    # A single prediction target, placed at the masked position.
    target_mapping = torch.zeros((1, 1, seq_len), dtype=torch.float)
    target_mapping[0, 0, mask_idx] = 1.0

    with torch.no_grad():
        predict = xlnet_model(
            input_ids, perm_mask=perm_mask, target_mapping=target_mapping
        )[0]
    # Only one target was requested, so it sits at index 0 of the second axis.
    candidates = predict[0, 0, :].topk(top_k).indices.tolist()
    return decode(xlnet_tokenizer, candidates, top_clean)


def get_all_predictions(text_sentence, top_clean=5):
    """Predict the ``<mask>`` word in ``text_sentence`` with every loaded model.

    Args:
        text_sentence: Text containing a ``<mask>`` placeholder.
        top_clean: Maximum number of cleaned candidates to keep per model.

    Returns:
        A dict keyed by ``'bert'``, ``'xlnet'``, ``'xlm'``, ``'bart'``,
        ``'electra'`` and ``'roberta'`` (in that insertion order); each value
        is the newline-separated string produced by ``decode``.

    NOTE(review): several lines of this function were cut off in the extracted
    listing. The ``.topk(top_k).indices.tolist(), top_clean)`` tails and the
    XLNet call were reconstructed from the visible fragments -- confirm
    against the original notebook.
    """
    predictions = {}

    # ========================= BERT =================================
    predictions['bert'] = _masked_lm_predictions(
        bert_tokenizer, bert_model, text_sentence, top_clean
    )

    # ========================= XLNET =================================
    predictions['xlnet'] = _xlnet_predictions(text_sentence, top_clean)

    # ========================= XLM ROBERTA =================================
    predictions['xlm'] = _masked_lm_predictions(
        xlmroberta_tokenizer, xlmroberta_model, text_sentence, top_clean
    )

    # ========================= BART =================================
    predictions['bart'] = _masked_lm_predictions(
        bart_tokenizer, bart_model, text_sentence, top_clean
    )

    # ========================= ELECTRA =================================
    predictions['electra'] = _masked_lm_predictions(
        electra_tokenizer, electra_model, text_sentence, top_clean
    )

    # ========================= ROBERTA =================================
    predictions['roberta'] = _masked_lm_predictions(
        roberta_tokenizer, roberta_model, text_sentence, top_clean
    )

    return predictions

Some weights of the model checkpoint at bert-base-uncased were not used when in
- This IS expected if you are initializing BertForMaskedLM from the checkpoint
- This IS NOT expected if you are initializing BertForMaskedLM from the checkpo
Some weights of the model checkpoint at xlm-roberta-base were not used when ini
- This IS expected if you are initializing XLMRobertaForMaskedLM from the check
- This IS NOT expected if you are initializing XLMRobertaForMaskedLM from the c
pytorch_model.bin: 100% 1.02G/1.02G [00:00<00:00, 4.73MB/s]

tokenizer_config.json: 100% 48.0/48.0 [00:00<00:00, 901B/s]

vocab.txt: 100% 232k/232k [00:00<00:00, 3.72MB/s]

tokenizer.json: 100% 466k/466k [00:00<00:00, 7.95MB/s]

config.json: 100% 662/662 [00:00<00:00, 14.4kB/s]

pytorch_model.bin: 100% 54.2M/54.2M [00:01<00:00, 33.2MB/s]

tokenizer_config.json: 100% 25.0/25.0 [00:00<00:00, 392B/s]

vocab.json: 100% 899k/899k [00:00<00:00, 16.6MB/s]

merges.txt: 100% 456k/456k [00:00<00:00, 4.88MB/s]

tokenizer.json: 100% 1.36M/1.36M [00:00<00:00, 23.1MB/s]

config.json: 100% 481/481 [00:00<00:00, 5.57kB/s]

model.safetensors: 100% 499M/499M [00:08<00:00, 37.2MB/s]

https://colab.research.google.com/drive/1GHFch9YpGkKgVo5TMxtQP7pHIeLg2QHc#scrollTo=PG5DaRp5j88o Page 3 of 5
transformer.ipynb - Colab 07/10/24, 2:22 PM

# Demo: ask every model to fill in the <mask> in one sentence.
text = "I am feeling great <mask>."

predictions = get_all_predictions(text)
# One section per model: upper-cased dict key, then its newline-separated
# candidates, followed by a blank line.
for model, result in predictions.items():
    print(f"{model.upper()} Predictions:\n{result}\n")

BERT Predictions:
for
about
with
now
and

XLNET Predictions:
awful
great
terrible
today
terrific

XLM Predictions:
in
i
at
for
and

BART Predictions:
and
today
…
physically
!!!

ELECTRA Predictions:
this
about
and
for
with

ROBERTA Predictions:
right
about
this
and
so

Start coding or generate with AI.

https://colab.research.google.com/drive/1GHFch9YpGkKgVo5TMxtQP7pHIeLg2QHc#scrollTo=PG5DaRp5j88o Page 4 of 5
transformer.ipynb - Colab 07/10/24, 2:22 PM

https://colab.research.google.com/drive/1GHFch9YpGkKgVo5TMxtQP7pHIeLg2QHc#scrollTo=PG5DaRp5j88o Page 5 of 5

The Illustrated Transformer - Jay Alammar - Visualizing Machine Learning One Concept at A Time - .Booklet
No ratings yet
The Illustrated Transformer - Jay Alammar - Visualizing Machine Learning One Concept at A Time - .Booklet
14 pages
BERT - Assignment - Jupyter Notebook
0% (2)
BERT - Assignment - Jupyter Notebook
8 pages
Siam Reiki Level 1 TBSRL1
No ratings yet
Siam Reiki Level 1 TBSRL1
41 pages
Deep Learning TensorFlow and Keras
No ratings yet
Deep Learning TensorFlow and Keras
454 pages
A Hands-On Guide To Text Classification With Transformer Models (XLNet, BERT, XLM, RoBERTa)
No ratings yet
A Hands-On Guide To Text Classification With Transformer Models (XLNet, BERT, XLM, RoBERTa)
9 pages
Classification CNN
No ratings yet
Classification CNN
7 pages
Text Classification With Transformer - 1716327784332
No ratings yet
Text Classification With Transformer - 1716327784332
3 pages
Fine-Tune Marian-MT Translation Model
No ratings yet
Fine-Tune Marian-MT Translation Model
9 pages
cl12 Huggingface
No ratings yet
cl12 Huggingface
34 pages
Medical Text Classifier GabrieldeOlaguibel
No ratings yet
Medical Text Classifier GabrieldeOlaguibel
12 pages
Hugging Face
100% (1)
Hugging Face
11 pages
Naseer Saab
No ratings yet
Naseer Saab
3 pages
Code Explanation
No ratings yet
Code Explanation
8 pages
Odir NN
No ratings yet
Odir NN
6 pages
DL Practical 09text Pre Processing
No ratings yet
DL Practical 09text Pre Processing
6 pages
Phase 2 Ibm
No ratings yet
Phase 2 Ibm
5 pages
IRT Lab Programs
No ratings yet
IRT Lab Programs
9 pages
NLP A3 Report
No ratings yet
NLP A3 Report
10 pages
Differ - Blog-Heres How You Can Build and Train GPT-2 From Scratch Using PyTorch
No ratings yet
Differ - Blog-Heres How You Can Build and Train GPT-2 From Scratch Using PyTorch
13 pages
Implementing BERT Tokenizers
No ratings yet
Implementing BERT Tokenizers
10 pages
Unsloth: Fast Llama-3 Training Guide
No ratings yet
Unsloth: Fast Llama-3 Training Guide
10 pages
Sentence Embedding Code
No ratings yet
Sentence Embedding Code
9 pages
Bert T
No ratings yet
Bert T
2 pages
Research Paper Summarization
No ratings yet
Research Paper Summarization
13 pages
Experiment 10 NLP
No ratings yet
Experiment 10 NLP
5 pages
Language Translation With NN - Transformer and Torchtext - PyTorch Tutorials 2.3.0+cu121 Documentation
No ratings yet
Language Translation With NN - Transformer and Torchtext - PyTorch Tutorials 2.3.0+cu121 Documentation
8 pages
Day 10 of Mastering LLMs - Tokenizers
No ratings yet
Day 10 of Mastering LLMs - Tokenizers
10 pages
Transformer
No ratings yet
Transformer
39 pages
Hand On Day 2 Salinan - Dari - 2 - Using - Transformers
No ratings yet
Hand On Day 2 Salinan - Dari - 2 - Using - Transformers
10 pages
13 2 Bert
No ratings yet
13 2 Bert
61 pages
Building A Large Language Model LLM From Scratch
No ratings yet
Building A Large Language Model LLM From Scratch
13 pages
Fine-Tuned Vs RAG Short Notes ?
No ratings yet
Fine-Tuned Vs RAG Short Notes ?
25 pages
Next Word Prediction With NLP and Deep Learning
No ratings yet
Next Word Prediction With NLP and Deep Learning
13 pages
566f0619-9145-4b8f-b12b-cb8a5b0cd30d
No ratings yet
566f0619-9145-4b8f-b12b-cb8a5b0cd30d
17 pages
Python NLP with Transformers
No ratings yet
Python NLP with Transformers
275 pages
Transformers Torch
No ratings yet
Transformers Torch
38 pages
Toeknizer
No ratings yet
Toeknizer
2 pages
NLP Exercise 10
No ratings yet
NLP Exercise 10
6 pages
Fast Llama Training Guide
No ratings yet
Fast Llama Training Guide
5 pages
DLT Experiment 2
No ratings yet
DLT Experiment 2
7 pages
ACL - 2020 - Mike Lewis - BART Denoising Sequence-To-Sequence Pre-Training For Natural Language Generation, Translation, and Comprehension
No ratings yet
ACL - 2020 - Mike Lewis - BART Denoising Sequence-To-Sequence Pre-Training For Natural Language Generation, Translation, and Comprehension
10 pages
4.1 Data Collection and Preprocessing
No ratings yet
4.1 Data Collection and Preprocessing
4 pages
Retorno 1
No ratings yet
Retorno 1
29 pages
2023 Aug How To Produce Data For A Neural networkORG
No ratings yet
2023 Aug How To Produce Data For A Neural networkORG
6 pages
7 Transformers
No ratings yet
7 Transformers
20 pages
22BCE9752 NLPDigital Assignment 02
No ratings yet
22BCE9752 NLPDigital Assignment 02
21 pages
QLSTMvs LSTM
No ratings yet
QLSTMvs LSTM
7 pages
Joshua K. Cage - Python Transformers by Huggingface Hands On - 101 Practical Implementation Hands-On of ALBERT - ViT - BigBird and Other Latest Models With Huggingface Transformers
No ratings yet
Joshua K. Cage - Python Transformers by Huggingface Hands On - 101 Practical Implementation Hands-On of ALBERT - ViT - BigBird and Other Latest Models With Huggingface Transformers
186 pages
Pre-Training BERT With Hugging Face Transformers and Habana Gaudi
No ratings yet
Pre-Training BERT With Hugging Face Transformers and Habana Gaudi
12 pages
Bert
No ratings yet
Bert
2 pages
UNIT-5 and 6
No ratings yet
UNIT-5 and 6
40 pages
Pretraining Part1 16 Mar 23 PDF
No ratings yet
Pretraining Part1 16 Mar 23 PDF
32 pages
Aiml 3
No ratings yet
Aiml 3
4 pages
Bert Tokenizer
No ratings yet
Bert Tokenizer
2 pages
Keras NER with Transformers Guide
No ratings yet
Keras NER with Transformers Guide
7 pages
Attention Mechanism
No ratings yet
Attention Mechanism
11 pages
NLP Model Pretraining with BART
No ratings yet
NLP Model Pretraining with BART
10 pages
Keras RNN Guide for Beginners
No ratings yet
Keras RNN Guide for Beginners
13 pages
Full Stack Syllabus
No ratings yet
Full Stack Syllabus
2 pages
Mod 4 Notes
No ratings yet
Mod 4 Notes
46 pages
CS 501 Course Outline DataMining
No ratings yet
CS 501 Course Outline DataMining
11 pages
Final Internship Report
No ratings yet
Final Internship Report
6 pages
CG User Agreement
No ratings yet
CG User Agreement
7 pages
MPDF
No ratings yet
MPDF
1 page
Wild Craft
No ratings yet
Wild Craft
1 page
Swift Programming Language - III
No ratings yet
Swift Programming Language - III
194 pages
JPN Pharma Brochure
No ratings yet
JPN Pharma Brochure
2 pages
English Present Tenses Practice
No ratings yet
English Present Tenses Practice
5 pages
Reyes Vernalyn D. Practicum 2
No ratings yet
Reyes Vernalyn D. Practicum 2
63 pages
FlowCon Green DN15 40 Tech Note 2024 03 EN
No ratings yet
FlowCon Green DN15 40 Tech Note 2024 03 EN
10 pages
Personal Statement
100% (1)
Personal Statement
3 pages
Top Ten Ways of Handling Guest Complaints
No ratings yet
Top Ten Ways of Handling Guest Complaints
6 pages
Interlocking Paver Block Making Cost: Top Layer 500
No ratings yet
Interlocking Paver Block Making Cost: Top Layer 500
5 pages
Subledger Accounting Program Report
No ratings yet
Subledger Accounting Program Report
3 pages
Week 1 Webinar
No ratings yet
Week 1 Webinar
26 pages
A Study of Interplay Between Judiciary and Parliament
100% (1)
A Study of Interplay Between Judiciary and Parliament
92 pages
Frankenstein: Rewriting Analysis
No ratings yet
Frankenstein: Rewriting Analysis
24 pages
Oracle iRecruitment Setup Guide
100% (1)
Oracle iRecruitment Setup Guide
33 pages
Delay-Tolerant Network Architecture
No ratings yet
Delay-Tolerant Network Architecture
17 pages
Bank Strategic Planning and Budgeting Process
No ratings yet
Bank Strategic Planning and Budgeting Process
18 pages
An Overview of Data Analysis and Interpretations in Research
No ratings yet
An Overview of Data Analysis and Interpretations in Research
3 pages
HGI Development Deck 2021
No ratings yet
HGI Development Deck 2021
57 pages
Business Apps Boost Efficiency
No ratings yet
Business Apps Boost Efficiency
3 pages
Httpbin (1) - HTTP Client Testing Service
No ratings yet
Httpbin (1) - HTTP Client Testing Service
2 pages
PHP Developer Training Course
No ratings yet
PHP Developer Training Course
10 pages
P5 Pre-Practical Exercise CHM 171 2904 (QP)
No ratings yet
P5 Pre-Practical Exercise CHM 171 2904 (QP)
4 pages
Reissuance Process - Lost Owner's Duplicate
No ratings yet
Reissuance Process - Lost Owner's Duplicate
5 pages
BR SprayMaster
No ratings yet
BR SprayMaster
16 pages
Ict Literacy
No ratings yet
Ict Literacy
36 pages
Luce Irigaray - Sharing The Fire - Outline of A Dialectics of Sensitivity (2019, Springer International Publishing - Palgrave Macmillan) PDF
100% (2)
Luce Irigaray - Sharing The Fire - Outline of A Dialectics of Sensitivity (2019, Springer International Publishing - Palgrave Macmillan) PDF
114 pages
PSNC Intervention Motion in MVP DC FERC Case
No ratings yet
PSNC Intervention Motion in MVP DC FERC Case
16 pages
Bio Enzyme Recipes
No ratings yet
Bio Enzyme Recipes
5 pages
A Review of Literature On Emotional Intelligence: Doa Naqvi
No ratings yet
A Review of Literature On Emotional Intelligence: Doa Naqvi
14 pages
Eng9045 3683
No ratings yet
Eng9045 3683
4 pages
Employment Law (Palgrave Law Masters) (PDFDrive)
No ratings yet
Employment Law (Palgrave Law Masters) (PDFDrive)
521 pages