# Source code for text_machina.src.tokenizers.openai
from typing import List
import tiktoken
from .base import Tokenizer
class OpenAITokenizer(Tokenizer):
    """
    Tokenizer for OpenAI models.

    Wraps the ``tiktoken`` encoding that corresponds to the given model name.
    """

    def __init__(self, model_name: str):
        """
        Build the tokenizer for an OpenAI model.

        Args:
            model_name (str): name of the OpenAI model. It is forwarded to
                the base ``Tokenizer`` initializer and then used to look up
                the matching ``tiktoken`` encoding.
        """
        super().__init__(model_name)
        # NOTE(review): ``self.model_name`` is presumably set by the base
        # initializer (not visible here) -- confirm against ``.base``.
        self.tokenizer = tiktoken.encoding_for_model(self.model_name)