Upload tokenizer
- tokenizer.json +8 -1
- tokenizer_config.json +1 -0
tokenizer.json
CHANGED
@@ -1,7 +1,14 @@
 {
   "version": "1.0",
   "truncation": null,
-  "padding": null,
+  "padding": {
+    "strategy": "BatchLongest",
+    "direction": "Left",
+    "pad_to_multiple_of": null,
+    "pad_id": 2,
+    "pad_type_id": 0,
+    "pad_token": "<|im_end|>"
+  },
   "added_tokens": [
     {
       "id": 0,
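For context, a padding block with these fields is what the tokenizers library serializes when batch padding is enabled on a Tokenizer. A minimal sketch that would produce the same entries (the file path is a placeholder, not part of this commit):

from tokenizers import Tokenizer

# Load the serialized tokenizer and enable dynamic left padding.
# pad_id 2 / "<|im_end|>" mirror the values added in this commit.
tok = Tokenizer.from_file("tokenizer.json")
tok.enable_padding(
    direction="left",        # serialized as "direction": "Left"
    pad_id=2,
    pad_type_id=0,
    pad_token="<|im_end|>",
)                            # no fixed length -> "strategy": "BatchLongest"
tok.save("tokenizer.json")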
tokenizer_config.json
CHANGED
@@ -149,6 +149,7 @@
   "extra_special_tokens": {},
   "model_max_length": 2048,
   "pad_token": "<|im_end|>",
+  "padding_side": "left",
   "tokenizer_class": "GPT2Tokenizer",
   "unk_token": "<|endoftext|>",
   "vocab_size": 49152
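On the transformers side, the same setting can be applied on the loaded tokenizer and written back with save_pretrained. A rough sketch, using a placeholder checkpoint path and assuming a transformers version recent enough to serialize padding_side into tokenizer_config.json:

from transformers import AutoTokenizer

# Placeholder path; any checkpoint carrying this tokenizer_config.json behaves the same.
tok = AutoTokenizer.from_pretrained("./checkpoint")
tok.padding_side = "left"
tok.pad_token = "<|im_end|>"

# With left padding, pad tokens go before the prompt, so batched generation
# appends new tokens directly after each prompt.
batch = tok(["Hello", "A longer prompt"], padding=True)

tok.save_pretrained("./checkpoint")  # re-writes tokenizer_config.json (and tokenizer.json)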