Spaces:
Running
on
Zero
Running
on
Zero
| # Copyright (c) Meta Platforms, Inc. and affiliates. | |
| import abc | |
| class Tokenizer(abc.ABC): | |
| def encode(self, text: str, add_bos: bool, add_eos: bool): | |
| pass | |
| def decode(self, tokens: list[int]): | |
| pass | |
| def get_token_offsets( | |
| self, text: str, tokens: list[int] | None = None | |
| ) -> tuple[list[str], list[int]]: | |
| """Return the offsets of the tokens in the original text. Only used for evaluation.""" | |
| pass | |