xzuyn committed on
Commit
aabcc2f
·
verified ·
1 Parent(s): 11d97d6

Upload 4 files

Browse files
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "do_sample": true,
5
+ "eos_token_id": 2,
6
+ "transformers_version": "4.46.3"
7
+ }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee57bd3271d8c200a06df40f9d7c94f8bb8f085b5cfb2d40907a794560df2ec3
3
- size 17078342
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65c87473250648ff00e0bbce348ad91c94609e132cfcc2adf56b6f1293d9afe6
3
+ size 9264495
tokenizer_config.json CHANGED
@@ -36,7 +36,7 @@
36
  "special": true
37
  },
38
  "4": {
39
- "content": "<SPECIAL_4>",
40
  "lstrip": false,
41
  "normalized": false,
42
  "rstrip": false,
@@ -8008,9 +8008,8 @@
8008
  "chat_template": "{%- set loop_messages = messages %}\n{%- for message in loop_messages %}\n {%- set content = '<|im_start|>' + message['role'] + '\\n'+ message['content'] | trim %}\n {%- if loop.index0 == 0 %}\n {%- set content = content %}\n {%- endif %}\n {%- if not (loop.last and message['role'] == 'assistant') %}\n {%- set content = content + '<|im_end|>\\n' %}\n {%- endif %}\n {{- content }}\n{%- endfor %}\n{%- if messages[-1]['role'] != 'assistant' %}\n {{- '<|im_start|>assistant\\n' }}\n{%- endif %}",
8009
  "clean_up_tokenization_spaces": false,
8010
  "eos_token": "<|im_end|>",
8011
- "extra_special_tokens": {},
8012
  "model_max_length": 1000000000000000019884624838656,
8013
  "pad_token": "<pad>",
8014
- "tokenizer_class": "PreTrainedTokenizer",
8015
  "unk_token": "<unk>"
8016
  }
 
36
  "special": true
37
  },
38
  "4": {
39
+ "content": "<SPECIAL_14>",
40
  "lstrip": false,
41
  "normalized": false,
42
  "rstrip": false,
 
8008
  "chat_template": "{%- set loop_messages = messages %}\n{%- for message in loop_messages %}\n {%- set content = '<|im_start|>' + message['role'] + '\\n'+ message['content'] | trim %}\n {%- if loop.index0 == 0 %}\n {%- set content = content %}\n {%- endif %}\n {%- if not (loop.last and message['role'] == 'assistant') %}\n {%- set content = content + '<|im_end|>\\n' %}\n {%- endif %}\n {{- content }}\n{%- endfor %}\n{%- if messages[-1]['role'] != 'assistant' %}\n {{- '<|im_start|>assistant\\n' }}\n{%- endif %}",
8009
  "clean_up_tokenization_spaces": false,
8010
  "eos_token": "<|im_end|>",
 
8011
  "model_max_length": 1000000000000000019884624838656,
8012
  "pad_token": "<pad>",
8013
+ "tokenizer_class": "PreTrainedTokenizerFast",
8014
  "unk_token": "<unk>"
8015
  }