#@title
# Notebook setup cell (IPython/Colab syntax; the `!` line below is a shell
# escape and is not valid in a plain Python interpreter).
from IPython.display import HTML
# Builds an empty HTML display object.
# NOTE(review): looks like a leftover placeholder — confirm it is still needed.
HTML('')
# Install the `datasets` and `transformers` packages (the latter with its
# `sentencepiece` extra) into the notebook environment.
! pip install datasets transformers[sentencepiece]
# Demo: show how the ALBERT tokenizer's pre-tokenization step splits a sample
# sentence, before any subword model is applied.
from transformers import AutoTokenizer

# `AutoTokenizer` is the public factory class; `use_fast=True` requests the
# fast tokenizer, which is required for the `backend_tokenizer` attribute
# accessed below.
tokenizer = AutoTokenizer.from_pretrained('albert-base-v1', use_fast=True)
text = "3.2.1: let's get started!"
# Print the result of running only the pre-tokenizer on the sample text.
print(tokenizer.backend_tokenizer.pre_tokenizer.pre_tokenize_str(text))