chrisociepa committed
Commit 474848e
1 Parent(s): 2c74a1f

Fix configs

generation_config.json CHANGED
@@ -1,6 +1,8 @@
 {
   "_from_model_config": true,
   "bos_token_id": 1,
-  "eos_token_id": 2,
-  "transformers_version": "4.43.4"
+  "eos_token_id": 32001,
+  "pad_token": 2,
+  "unk_token": 0,
+  "transformers_version": "4.39.3"
 }
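After this change, generate() should stop on token id 32001 rather than id 2. A minimal check that the updated file is picked up, assuming it is loaded straight from this repository; the repo id below is a placeholder, not taken from the commit.

from transformers import GenerationConfig

# Placeholder repo id; substitute the actual model repository.
gen_config = GenerationConfig.from_pretrained("your-org/your-model")
print(gen_config.eos_token_id)  # expected after this commit: 32001
print(gen_config.bos_token_id)  # unchanged: 1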
special_tokens_map.json CHANGED
@@ -137,7 +137,7 @@
     "single_word": false
   },
   "eos_token": {
-    "content": "</s>",
+    "content": "<|im_end|>",
     "lstrip": false,
     "normalized": false,
     "rstrip": false,
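A quick way to confirm the tokenizer reports the new EOS token once the updated special_tokens_map.json is loaded; again the repo id is a placeholder.

from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("your-org/your-model")  # placeholder repo id
print(tokenizer.eos_token)     # expected after this commit: <|im_end|>
print(tokenizer.eos_token_id)  # expected to match the 32001 set in generation_config.json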
tokenizer.json CHANGED
@@ -1203,6 +1203,12 @@
   "post_processor": {
     "type": "TemplateProcessing",
     "single": [
+      {
+        "SpecialToken": {
+          "id": "<s>",
+          "type_id": 0
+        }
+      },
       {
         "Sequence": {
           "id": "A",
@@ -1211,12 +1217,24 @@
       }
     ],
     "pair": [
+      {
+        "SpecialToken": {
+          "id": "<s>",
+          "type_id": 0
+        }
+      },
       {
         "Sequence": {
           "id": "A",
           "type_id": 0
         }
       },
+      {
+        "SpecialToken": {
+          "id": "<s>",
+          "type_id": 1
+        }
+      },
       {
         "Sequence": {
           "id": "B",
@@ -1224,7 +1242,17 @@
         }
       }
     ],
-    "special_tokens": {}
+    "special_tokens": {
+      "<s>": {
+        "id": "<s>",
+        "ids": [
+          1
+        ],
+        "tokens": [
+          "<s>"
+        ]
+      }
+    }
   },
   "decoder": {
     "type": "Sequence",
tokenizer_config.json CHANGED
@@ -1185,7 +1185,7 @@
   "bos_token": "<s>",
   "chat_template": "{{bos_token}}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
   "clean_up_tokenization_spaces": true,
-  "eos_token": "</s>",
+  "eos_token": "<|im_end|>",
   "legacy": true,
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "</s>",