File tree Expand file tree Collapse file tree 1 file changed +4
-4
lines changed
tests/torchtune/modules/tokenizers Expand file tree Collapse file tree 1 file changed +4
-4
lines changed Original file line number Diff line number Diff line change @@ -38,7 +38,6 @@ def texts(self):
38
38
@pytest .fixture
39
39
def token_ids (self ):
40
40
return [
41
- 0 ,
42
41
73 ,
43
42
503 ,
44
43
654 ,
@@ -64,17 +63,18 @@ def token_ids(self):
64
63
511 ,
65
64
115 ,
66
65
46 ,
67
- - 1 ,
68
66
]
69
67
70
68
def test_encode (self , tokenizer , texts , token_ids ):
71
- assert tokenizer .encode (texts [0 ]) == token_ids
69
+ assert tokenizer .encode (texts [0 ], add_bos = True , add_eos = True ) == [
70
+ 0
71
+ ] + token_ids + [- 1 ]
72
72
73
73
def test_decode (self , tokenizer , texts , token_ids ):
74
74
assert tokenizer .decode (token_ids ) == texts [0 ]
75
75
76
76
def test_encode_and_decode (self , tokenizer , texts ):
77
- token_ids = tokenizer .encode (texts [0 ])
77
+ token_ids = tokenizer .encode (texts [0 ], add_bos = False , add_eos = False )
78
78
decoded_text = tokenizer .decode (token_ids )
79
79
assert texts [0 ] == decoded_text
80
80
You can’t perform that action at this time.
0 commit comments