# NOT RUN {
# Construct a FullTokenizer from the vocabulary file "vocab.txt", then
# tokenize a short sample string with it.
# NOTE(review): "vocab.txt" looks like a placeholder path -- point it at a
# real vocabulary file before running.
tokenizer <- FullTokenizer(vocab_file = "vocab.txt", do_lower_case = TRUE)
tokenize(tokenizer, text = "a bunch of words")
# }
# NOT RUN {
# Construct a BasicTokenizer (no vocabulary argument is passed here) and
# tokenize the same sample string.
# NOTE(review): do_lower_case = TRUE presumably lower-cases the input before
# splitting -- confirm against the package documentation.
tokenizer <- BasicTokenizer(do_lower_case = TRUE)
tokenize(tokenizer, text = "a bunch of words")
# }
# NOT RUN {
# Two-step setup: load the vocabulary from "vocab.txt" first, then build a
# WordpieceTokenizer from the loaded vocabulary and tokenize the sample string.
# NOTE(review): "vocab.txt" looks like a placeholder path -- point it at a
# real vocabulary file before running.
vocab <- load_vocab(vocab_file = "vocab.txt")
tokenizer <- WordpieceTokenizer(vocab = vocab)
tokenize(tokenizer, text = "a bunch of words")
# }
# Run the code above in your browser using DataLab