Skip to content

Commit 2f66939

Browse files
committed
Fix chat script
1 parent 249525b commit 2f66939

2 files changed

Lines changed: 11 additions & 2 deletions

File tree

chat.py

Lines changed: 5 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,8 @@
1010
from colored import fore_rgb, style
1111

1212
from src.nope_gpt.model import NoPEGPT
13-
from nope_gpt.memory import BufferWindowMemory
13+
from src.nope_gpt.tokenization import BaseTokenizer, ChatTokenizer
14+
from src.nope_gpt.memory import BufferWindowMemory
1415

1516
DEFAULT_SYSTEM_MESSAGE = (
1617
"You're a helpful AI assistant named NoPE GPT. "
@@ -52,7 +53,9 @@ def main():
5253
args.checkpoint_path, map_location=args.device, weights_only=False
5354
)
5455

55-
tokenizer = checkpoint["tokenizer"]
56+
tokenizer = BaseTokenizer.from_tiktoken(**checkpoint["tokenizer_args"])
57+
58+
tokenizer = ChatTokenizer(tokenizer)
5659

5760
model = NoPEGPT(**checkpoint["model_args"])
5861

src/nope_gpt/tokenization.py

Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -146,6 +146,12 @@ class ChatTokenizer(ModelHubMixin):
146146

147147
RESPONSE_HEADER = "<|im_start|>assistant\n"
148148

149+
@classmethod
150+
def from_tiktoken(cls, name: str) -> Self:
151+
"""Instantiate a tokenizer from a pretrained tiktoken tokenizer."""
152+
153+
return cls(get_encoding(name))
154+
149155
@classmethod
150156
def _from_pretrained(
151157
cls,

0 commit comments

Comments
 (0)