vui-space / vui /tok.py
Harry Coultas Blum
tryin relative imports
a1a9d33
raw
history blame contribute delete
574 Bytes
import torch
from transformers import ByT5Tokenizer
class CustomByT5Tokenizer(ByT5Tokenizer):
    """ByT5 tokenizer whose ``encode`` returns token ids as a ``torch.Tensor``.

    In this override ``add_special_tokens`` defaults to ``False``.
    """

    def encode(
        self, text: str, add_special_tokens: bool = False, **kwargs
    ) -> torch.Tensor:
        """Encode ``text`` with the parent tokenizer and wrap the ids in a tensor.

        Args:
            text (str): Input text.
            add_special_tokens (bool): Forwarded to the parent ``encode``;
                controls whether special tokens are added to the ids.
            **kwargs: Passed through unchanged to the parent ``encode``.

        Returns:
            torch.Tensor: The token ids with dtype ``torch.long``.
        """
        # Delegate the actual tokenization to the parent class.
        tokens = super().encode(
            text, add_special_tokens=add_special_tokens, **kwargs
        )
        # Pin the dtype: torch.tensor([]) would otherwise infer float32 for an
        # empty id list, giving callers a float tensor for empty input while
        # every non-empty input yields int64.
        return torch.tensor(tokens, dtype=torch.long)
# Module-level tokenizer instance, created when this module is imported by
# loading the "google/byt5-small" pretrained tokenizer.
# NOTE(review): from_pretrained presumably reads from the local cache or the
# network at import time — confirm this side effect is acceptable for importers.
tok = CustomByT5Tokenizer.from_pretrained("google/byt5-small")