Xenova HF Staff committed 1 day ago

Commit

8baf569

verified ·

1 Parent(s): 6f98127

Upload folder using huggingface_hub

Browse files

Files changed (20) hide show

.gitattributes +13 -0
chat_template.jinja +122 -0
config.json +131 -0
generation_config.json +10 -0
onnx/model_fp16.onnx +3 -0
onnx/model_fp16.onnx_data +3 -0
onnx/model_fp16.onnx_data_1 +3 -0
onnx/model_fp16.onnx_data_2 +3 -0
onnx/model_fp16.onnx_data_3 +3 -0
onnx/model_fp16.onnx_data_4 +3 -0
onnx/model_fp16.onnx_data_5 +3 -0
onnx/model_fp16.onnx_data_6 +3 -0
onnx/model_fp16.onnx_data_7 +3 -0
onnx/model_fp16.onnx_data_8 +3 -0
onnx/model_q4f16.onnx +3 -0
onnx/model_q4f16.onnx_data +3 -0
onnx/model_q4f16.onnx_data_1 +3 -0
onnx/model_q4f16.onnx_data_2 +3 -0
tokenizer.json +3 -0
tokenizer_config.json +16 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
+onnx/model_fp16.onnx_data_1 filter=lfs diff=lfs merge=lfs -text
+onnx/model_fp16.onnx_data_2 filter=lfs diff=lfs merge=lfs -text
+onnx/model_fp16.onnx_data_3 filter=lfs diff=lfs merge=lfs -text
+onnx/model_fp16.onnx_data_4 filter=lfs diff=lfs merge=lfs -text
+onnx/model_fp16.onnx_data_5 filter=lfs diff=lfs merge=lfs -text
+onnx/model_fp16.onnx_data_6 filter=lfs diff=lfs merge=lfs -text
+onnx/model_fp16.onnx_data_7 filter=lfs diff=lfs merge=lfs -text
+onnx/model_fp16.onnx_data_8 filter=lfs diff=lfs merge=lfs -text
+onnx/model_q4f16.onnx_data filter=lfs diff=lfs merge=lfs -text
+onnx/model_q4f16.onnx_data_1 filter=lfs diff=lfs merge=lfs -text
+onnx/model_q4f16.onnx_data_2 filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

chat_template.jinja ADDED Viewed

	@@ -0,0 +1,122 @@

+{# State shared across the template.
+   ns: scratch namespace written by the reverse scan over messages further down;
+       multi_step_tool starts true and last_query_index starts at the final message index.
+   emit: started records whether bos_token has already been prepended to the output. #}
+{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) -%}
+{%- set emit = namespace(started=false) -%}
+{# ---------- Build base system message (always emitted) ----------
+   Fixed identity line ending in a newline; it is placed first inside the system turn
+   in both the tools branch and the no-tools branch. #}
+{%- set base_system = 'You are rnj-1, a foundation model trained by Essential AI.\n' -%}
+{# ---------- Optional tools preface as a synthetic system message ----------
+   When tools is truthy, sys_preamble captures the literal instructions below plus one
+   JSON-serialized entry per tool between the tools tags. The text inside the set block
+   is captured as written, so its line breaks become part of the prompt (subject to the
+   whitespace-trimming settings of the renderer). #}
+{%- if tools %}
+  {%- set sys_preamble -%}
+# Tools
+You may call one or more functions to assist with the user query.
+You are provided with function signatures within <tools></tools> XML tags:
+<tools>
+{%- for tool in tools %}
+{{ "\n" ~ (tool | tojson) }}
+{% endfor %}
+</tools>
+For each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:
+<tool_call>
+{"name": <function-name>, "arguments": <args-json-object>}
+</tool_call>
+  {%- endset -%}
+  {# If the first user-provided message is system, include it above the tools preface.
+     Only string content qualifies; it is joined to the preface with a blank line.
+     Otherwise sys_content is the preface alone. #}
+  {%- set combined_system = (messages and messages[0].role == 'system')
+      and (messages[0].content is string) -%}
+  {%- set sys_content = (combined_system and (messages[0].content ~ "\n\n" ~ sys_preamble)) or sys_preamble -%}
+  {%- set content = '<|start_header_id|>system<|end_header_id|>\n' ~ base_system ~ '\n' ~ sys_content ~ '<|eot_id|>' -%}
+  {# emit.started is still false at this point, so bos_token is prepended here. #}
+  {%- if not emit.started -%}{%- set content = bos_token ~ content -%}{%- set emit.started = true -%}{%- endif -%}
+  {{- content -}}
+{%- else %}
+  {# No tools: always emit base_system, and include user's system message if present.
+     A leading system message whose content is not a string is not included. #}
+  {%- set user_system_content = '' -%}
+  {%- if messages and messages[0].role == 'system' and (messages[0].content is string) -%}
+    {%- set user_system_content = '\n' ~ messages[0].content -%}
+  {%- endif -%}
+  {%- set content = '<|start_header_id|>system<|end_header_id|>\n' ~ base_system ~ user_system_content ~ '<|eot_id|>' -%}
+  {%- if not emit.started -%}{%- set content = bos_token ~ content -%}{%- set emit.started = true -%}{%- endif -%}
+  {{- content -}}
+{%- endif -%}
+{# ---------- Locate last user query for multi-step tool behavior ----------
+   Walks messages from last to first. The first match, a user message with string content
+   that does not both start with the tool_response opening tag and end with its closing
+   tag, stores its forward index in ns.last_query_index and clears ns.multi_step_tool,
+   which keeps later iterations from overwriting the index.
+   NOTE(review): ns.last_query_index is not read anywhere else in this template and this
+   loop emits no output; confirm whether the scan is still needed. #}
+{%- for message in messages[::-1] %}
+  {%- set index = (messages|length - 1) - loop.index0 -%}
+  {%- if ns.multi_step_tool
+        and message.role == "user"
+        and message.content is string
+        and not (message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) -%}
+    {%- set ns.multi_step_tool = false -%}
+    {%- set ns.last_query_index = index -%}
+  {%- endif -%}
+{%- endfor -%}
+{# ---------- Walk all messages and emit in Llama-3 format ----------
+   Each message is dispatched on its role. Roles other than user, system, assistant and
+   tool match no branch below and emit nothing. The system block earlier in this template
+   always sets emit.started, so the bos_token guards in this loop act only as a fallback. #}
+{%- for message in messages %}
+  {# normalize content: anything that is not a string is rendered as empty text #}
+  {%- if message.content is string -%}
+    {%- set content = message.content -%}
+  {%- else -%}
+    {%- set content = '' -%}
+  {%- endif -%}
+  {# --- user/system (non-initial system already handled above) ---
+     A system message in first position is skipped here; later system messages are
+     emitted as their own turn under a system header. #}
+  {%- if (message.role == "user") or (message.role == "system" and not loop.first) -%}
+    {%- set block = '<|start_header_id|>' ~ message.role ~ '<|end_header_id|>\n' ~ content ~ '<|eot_id|>' -%}
+    {%- if not emit.started -%}{%- set block = bos_token ~ block -%}{%- set emit.started = true -%}{%- endif -%}
+    {{- block -}}
+  {# --- assistant ---
+     The header is emitted first; content, tool calls and the closing eot token are emitted
+     inside the generation block. A tool call may be an object with a function field or the
+     flat name/arguments object itself. String arguments are passed through unchanged and
+     anything else is serialized with tojson. Calls after the first start with a newline;
+     no separator is inserted between the content and the first call.
+     NOTE(review): the generation tag presumably marks the assistant span for token
+     masking; confirm that the target renderer supports it. #}
+  {%- elif message.role == "assistant" -%}
+    {%- set body = content -%}
+    {%- set header = '<|start_header_id|>assistant<|end_header_id|>\n' -%}
+    {%- if not emit.started -%}{{ bos_token }}{%- set emit.started = true -%}{%- endif -%}
+    {{- header -}}
+    {% generation %}
+    {{- body -}}
+    {%- if message.tool_calls -%}
+      {%- for tool_call in message.tool_calls -%}
+        {%- if tool_call.function -%}{%- set tc = tool_call.function -%}{%- else -%}{%- set tc = tool_call -%}{%- endif -%}
+        {%- set args_json = (tc.arguments if (tc.arguments is string) else (tc.arguments | tojson)) -%}
+        {%- if loop.first -%}
+          {{- '<tool_call>\n{"name": "' ~ tc.name ~ '", "arguments": ' ~ args_json ~ '}\n</tool_call>' -}}
+        {%- else -%}
+          {{- '\n<tool_call>\n{"name": "' ~ tc.name ~ '", "arguments": ' ~ args_json ~ '}\n</tool_call>' -}}
+        {%- endif -%}
+      {%- endfor -%}
+    {%- endif -%}
+    {{- '<|eot_id|>' -}}{%- endgeneration -%}
+  {# --- tool messages are wrapped as synthetic user messages with <tool_response> ---
+     open_user is true for the first message or when the previous message is not a tool
+     message; close_user is true for the last message or when the next message is not a
+     tool message. Consecutive tool messages therefore share one user turn, with each
+     response after the first preceded by a newline. #}
+  {%- elif message.role == "tool" -%}
+    {%- set open_user = (loop.first or (loop.index0 > 0 and messages[loop.index0 - 1].role != "tool")) -%}
+    {%- set close_user = (loop.last or (loop.index0 < messages|length - 1 and messages[loop.index0 + 1].role != "tool")) -%}
+    {%- if open_user -%}
+      {%- set header = '<|start_header_id|>user<|end_header_id|>\n' -%}
+      {%- if not emit.started -%}{%- set header = bos_token ~ header -%}{%- set emit.started = true -%}{%- endif -%}
+      {{- header -}}
+    {%- endif -%}
+    {%- if open_user -%}
+      {{- '<tool_response>\n' -}}
+    {%- else -%}
+      {{- '\n<tool_response>\n' -}}
+    {%- endif -%}
+    {{- content -}}
+    {{- '\n</tool_response>' -}}
+    {%- if close_user -%}
+      {{- '<|eot_id|>' -}}
+    {%- endif -%}
+  {%- endif -%}
+{%- endfor -%}
+{# ---------- Add generation prompt header for the model to continue ----------
+   When add_generation_prompt is truthy, an assistant header is appended with no closing
+   eot token, leaving the assistant turn open. #}
+{%- if add_generation_prompt -%}
+  {%- set tail = '<|start_header_id|>assistant<|end_header_id|>\n' -%}
+  {{- tail -}}
+{%- endif -%}

config.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "_sliding_window_pattern": 1,
+  "architectures": [
+    "Gemma3ForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "attn_logit_softcapping": null,
+  "bos_token_id": 2,
+  "cache_implementation": "hybrid",
+  "dtype": "float32",
+  "eos_token_id": 1,
+  "final_logit_softcapping": 30.0,
+  "head_dim": 128,
+  "hidden_act": "gelu_pytorch_tanh",
+  "hidden_activation": "gelu_pytorch_tanh",
+  "hidden_size": 4096,
+  "initializer_range": 0.02,
+  "intermediate_size": 16384,
+  "layer_type": [
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention"
+  ],
+  "layer_types": [
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention"
+  ],
+  "max_position_embeddings": 32768,
+  "model_type": "gemma3_text",
+  "num_attention_heads": 32,
+  "num_hidden_layers": 32,
+  "num_key_value_heads": 8,
+  "pad_token_id": 0,
+  "query_pre_attn_scalar": 128,
+  "rms_norm_eps": 1e-06,
+  "rope_parameters": {
+    "full_attention": {
+      "attn_factor": 1.0,
+      "beta_fast": 64.0,
+      "beta_slow": 1.0,
+      "extrapolation_factor": 1.0,
+      "factor": 4.0,
+      "original_max_position_embeddings": 8192,
+      "rope_theta": 10000,
+      "rope_type": "yarn"
+    },
+    "rope_theta": null,
+    "rope_type": "default",
+    "sliding_attention": {
+      "rope_theta": 10000,
+      "rope_type": "default"
+    }
+  },
+  "sliding_window": 32768,
+  "sliding_window_pattern": 1,
+  "transformers_version": "5.0.0.dev0",
+  "use_bidirectional_attention": false,
+  "use_cache": true,
+  "vocab_size": 128256,
+  "transformers.js_config": {
+    "dtype": "q4f16",
+    "use_external_data_format": {
+      "model_fp16.onnx": 9,
+      "model_q4f16.onnx": 3
+    },
+    "kv_cache_dtype": {
+      "q4f16": "float16",
+      "fp16": "float16"
+    }
+  }
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 128000,
+  "cache_implementation": "hybrid",
+  "do_sample": true,
+  "eos_token_id": 128009,
+  "pad_token_id": 128001,
+  "temperature": 0.2,
+  "transformers_version": "5.0.0.dev0"
+}

onnx/model_fp16.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6763481820c99f88b219ef8e6bce1db9929d108620a2a6437a926fdcdfebd384
+size 504979

onnx/model_fp16.onnx_data ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:35cfb38e236478aad1824c62d9dcc0fb88e851482e0b36cfdde20b42a2651b41
+size 2082619392

onnx/model_fp16.onnx_data_1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4c31671ea730a7553f2ec672ea863d866227f67f6d1d2d28e60c1a024d0f83be
+size 1980006400

onnx/model_fp16.onnx_data_2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:88dba5de3c3e90bfa8493e06d94bc9ba1725f57418dbe0b57463f058bec599c9
+size 2080636928

onnx/model_fp16.onnx_data_3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:21825579d2392f30684a8f166073f41f1df008f5bfab996c0e3c9646153f47b9
+size 2080636928

onnx/model_fp16.onnx_data_4 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b94f1000656f3ab8c30cc896eda041621c0573173b147ebaf97ec00de622fec
+size 2080669696

onnx/model_fp16.onnx_data_5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:952c3436cb035bf8de3077f47f27a44a0993e7425067b61b5795914d083b9af7
+size 2030338048

onnx/model_fp16.onnx_data_6 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a5fe38be50af847e1cf2a6037ea1a3cc6ac49a3f54674b7db2cbbdb90f9e527f
+size 2080636928

onnx/model_fp16.onnx_data_7 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:137ef50635ea2e0f4549ca22100ea7a697a99ccc0829c358ffcdaa8c3f7bf581
+size 2080636928

onnx/model_fp16.onnx_data_8 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:96066570bc06cec1477ef769f6722868a5c5a405255faa9885a79a9e7840040d
+size 134250496

onnx/model_q4f16.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:707393551025902b9af273c226a40a6d4e084e175793cad3168cb2f6fe04087a
+size 608779

onnx/model_q4f16.onnx_data ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5dec1d52dc1fa694905f49da2a5723990e79a614040df77343928381d7e60e79
+size 2074628096

onnx/model_q4f16.onnx_data_1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d12934aa9713e6520d9b3c89f4b2c2b8fa1d51e03acb0b1fbc4c03a6ef51b489
+size 2091909120

onnx/model_q4f16.onnx_data_2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4a4a03b201eaa920b6bb1c4d5fefc9b65f42f02a5e27101b922df808fa056102
+size 423919616

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fcd228d2df6206bf4b2df4207937aed031cb659115a8af2cf65ca20a98343b0c
+size 11574513

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "additional_special_tokens": null,
+  "backend": "tokenizers",
+  "bos_token": "<|begin_of_text|>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "<|end_of_text|>",
+  "is_local": false,
+  "model_input_names": [
+    "input_ids",
+    "attention_mask"
+  ],
+  "model_max_length": 1000000000000000019884624838656,
+  "model_specific_special_tokens": {},
+  "tokenizer_class": "TokenizersBackend",
+  "chat_template": "{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) -%}\n{%- set emit = namespace(started=false) -%}\n\n{# ---------- Build base system message (always emitted) ---------- #}\n{%- set base_system = 'You are rnj-1, a foundation model trained by Essential AI.\\n' -%}\n\n{# ---------- Optional tools preface as a synthetic system message ---------- #}\n{%- if tools %}\n  {%- set sys_preamble -%}\n# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>\n{%- for tool in tools %}\n{{ \"\\n\" ~ (tool | tojson) }}\n{% endfor %}\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call>\n  {%- endset -%}\n\n  {# If the first user-provided message is system, include it above the tools preface #}\n  {%- set combined_system = (messages and messages[0].role == 'system')\n      and (messages[0].content is string) -%}\n  {%- set sys_content = (combined_system and (messages[0].content ~ \"\\n\\n\" ~ sys_preamble)) or sys_preamble -%}\n\n  {%- set content = '<|start_header_id|>system<|end_header_id|>\\n' ~ base_system ~ '\\n' ~ sys_content ~ '<|eot_id|>' -%}\n  {%- if not emit.started -%}{%- set content = bos_token ~ content -%}{%- set emit.started = true -%}{%- endif -%}\n  {{- content -}}\n{%- else %}\n  {# No tools: always emit base_system, and include user's system message if present #}\n  {%- set user_system_content = '' -%}\n  {%- if messages and messages[0].role == 'system' and (messages[0].content is string) -%}\n    {%- set user_system_content = '\\n' ~ messages[0].content -%}\n  {%- endif -%}\n  {%- set content = '<|start_header_id|>system<|end_header_id|>\\n' ~ base_system ~ user_system_content ~ '<|eot_id|>' -%}\n  {%- if not emit.started -%}{%- set 
content = bos_token ~ content -%}{%- set emit.started = true -%}{%- endif -%}\n  {{- content -}}\n{%- endif -%}\n\n{# ---------- Locate last user query for multi-step tool behavior ---------- #}\n{%- for message in messages[::-1] %}\n  {%- set index = (messages|length - 1) - loop.index0 -%}\n  {%- if ns.multi_step_tool\n        and message.role == \"user\"\n        and message.content is string\n        and not (message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) -%}\n    {%- set ns.multi_step_tool = false -%}\n    {%- set ns.last_query_index = index -%}\n  {%- endif -%}\n{%- endfor -%}\n\n{# ---------- Walk all messages and emit in Llama-3 format ---------- #}\n{%- for message in messages %}\n  {# normalize content #}\n  {%- if message.content is string -%}\n    {%- set content = message.content -%}\n  {%- else -%}\n    {%- set content = '' -%}\n  {%- endif -%}\n\n  {# --- user/system (non-initial system already handled above) --- #}\n  {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) -%}\n    {%- set block = '<|start_header_id|>' ~ message.role ~ '<|end_header_id|>\\n' ~ content ~ '<|eot_id|>' -%}\n    {%- if not emit.started -%}{%- set block = bos_token ~ block -%}{%- set emit.started = true -%}{%- endif -%}\n    {{- block -}}\n\n  {# --- assistant --- #}\n  {%- elif message.role == \"assistant\" -%}\n  \n    {%- set body = content -%}\n    {%- set header = '<|start_header_id|>assistant<|end_header_id|>\\n' -%}\n    {%- if not emit.started -%}{{ bos_token }}{%- set emit.started = true -%}{%- endif -%}\n    {{- header -}}\n    {% generation %}\n    {{- body -}}\n    {%- if message.tool_calls -%}\n      {%- for tool_call in message.tool_calls -%}\n        {%- if tool_call.function -%}{%- set tc = tool_call.function -%}{%- else -%}{%- set tc = tool_call -%}{%- endif -%}\n        {%- set args_json = (tc.arguments if (tc.arguments is string) else (tc.arguments | tojson)) -%}\n        {%- 
if loop.first -%}\n          {{- '<tool_call>\\n{\"name\": \"' ~ tc.name ~ '\", \"arguments\": ' ~ args_json ~ '}\\n</tool_call>' -}}\n        {%- else -%}\n          {{- '\\n<tool_call>\\n{\"name\": \"' ~ tc.name ~ '\", \"arguments\": ' ~ args_json ~ '}\\n</tool_call>' -}}\n        {%- endif -%}\n      {%- endfor -%}\n    {%- endif -%}\n    {{- '<|eot_id|>' -}}{%- endgeneration -%}\n  {# --- tool messages are wrapped as synthetic user messages with <tool_response> --- #}\n  {%- elif message.role == \"tool\" -%}\n    {%- set open_user = (loop.first or (loop.index0 > 0 and messages[loop.index0 - 1].role != \"tool\")) -%}\n    {%- set close_user = (loop.last or (loop.index0 < messages|length - 1 and messages[loop.index0 + 1].role != \"tool\")) -%}\n\n    {%- if open_user -%}\n      {%- set header = '<|start_header_id|>user<|end_header_id|>\\n' -%}\n      {%- if not emit.started -%}{%- set header = bos_token ~ header -%}{%- set emit.started = true -%}{%- endif -%}\n      {{- header -}}\n    {%- endif -%}\n    {%- if open_user -%}\n      {{- '<tool_response>\\n' -}}\n    {%- else -%}\n      {{- '\\n<tool_response>\\n' -}}\n    {%- endif -%}\n    {{- content -}}\n    {{- '\\n</tool_response>' -}}\n\n    {%- if close_user -%}\n      {{- '<|eot_id|>' -}}\n    {%- endif -%}\n  {%- endif -%}\n{%- endfor -%}\n\n{# ---------- Add generation prompt header for the model to continue ---------- #}\n{%- if add_generation_prompt -%}\n  {%- set tail = '<|start_header_id|>assistant<|end_header_id|>\\n' -%}\n  {{- tail -}}\n{%- endif -%}"
+}