Skip to content

Commit 426c915

Browse files
authored
move tokenizer model to third party llama2 (#27)
1 parent a7e7e81 commit 426c915

2 files changed

Lines changed: 1 addition & 2 deletions

File tree

jetstream/tests/engine/test_token_utils.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -48,7 +48,7 @@ def decode(self, t: int) -> str:
4848

4949
class TokenUtilsTest(unittest.TestCase):
5050
def setup(self):
51-
tokenizer_path = "tokenizer.model"
51+
tokenizer_path = "third_party/llama2/tokenizer.model"
5252
current_dir = os.path.dirname(__file__)
5353
tokenizer_path = os.path.join(current_dir, tokenizer_path)
5454
print(f"model_path: {tokenizer_path}")
@@ -61,7 +61,6 @@ def test_decode_vs_piece(self):
6161
tokens = [304, 13, 2266, 526, 777, 9590, 2020, 29901]
6262
expeted_sp_output = []
6363
jt_output = []
64-
print(f"jt_output: {jt_output}")
6564
for t in tokens:
6665
expeted_sp_output.append(self.sp_tokenizer.decode([t]))
6766
jt_output.append(self.jt_tokenizer.decode(t))
File renamed without changes.

0 commit comments

Comments
 (0)