diff --git a/.gitattributes b/.gitattributes index e5773c9db742e7caddd6b403bea8d8535c34494c..56095c5d5a036125dbbb8147e7ccf2e3089beed9 100644 --- a/.gitattributes +++ b/.gitattributes @@ -3127,3 +3127,68 @@ qwen3-4b-log-unary/model_layers_24_self_attn_o_proj_weight.sign filter=lfs diff= qwen3-4b-log-unary/model_layers_9_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text qwen3-4b-log-unary/model_layers_8_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text qwen3-4b-log-unary/model_layers_23_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_12_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_22_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_28_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_3_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_32_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_23_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_26_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_14_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_12_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_33_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_23_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_1_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_18_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_13_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_7_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_1_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_16_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_31_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_3_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_35_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_20_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_18_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_6_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_23_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_23_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_15_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_26_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_23_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_26_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_22_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_29_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_9_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_2_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_8_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_21_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_10_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_20_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_31_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_30_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_32_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_9_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_32_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_35_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_21_self_attn_o_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_25_self_attn_o_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_34_mlp_down_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_19_self_attn_q_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_25_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_18_mlp_down_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_0_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_13_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_6_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_1_mlp_gate_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_30_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_7_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_1_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_14_self_attn_v_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_11_mlp_up_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_30_self_attn_q_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_30_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_28_self_attn_k_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_0_mlp_up_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_7_self_attn_v_proj_weight.sign filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_16_mlp_gate_proj_weight.planes filter=lfs diff=lfs merge=lfs -text +qwen3-4b-log-unary/model_layers_29_self_attn_k_proj_weight.sign filter=lfs diff=lfs merge=lfs -text diff --git a/deepseek-r1-1.5b-unary/model_layers_14_self_attn_q_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_14_self_attn_q_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..e19416ac38523b6973fed2868cc08b57b808764e Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_14_self_attn_q_proj_weight.scales differ diff --git a/deepseek-r1-1.5b-unary/model_layers_1_mlp_up_proj_weight.scales b/deepseek-r1-1.5b-unary/model_layers_1_mlp_up_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..d35b08b5b5f164a9960993c7106c369951cf641a Binary files /dev/null and b/deepseek-r1-1.5b-unary/model_layers_1_mlp_up_proj_weight.scales differ diff --git a/qwen3-4b-log-unary/model_layers_0_mlp_up_proj_weight.sign b/qwen3-4b-log-unary/model_layers_0_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0a6b322944323a0c3863e1d9a9a90ce7240eb883 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_0_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14a813788b2c3a35297734a3441d9dee4428c54ae358a51f63592e7fb8aab4cc +size 3112960 diff --git a/qwen3-4b-log-unary/model_layers_0_self_attn_k_proj_weight.sign b/qwen3-4b-log-unary/model_layers_0_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..056facb0ddd4498eb07dc1cfce98e8c0f61199f8 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_0_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327328afcb3bc4ffbd38526a501f84bb9f6038b84497df3c306ebe7f076c6c16 +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_10_mlp_up_proj_weight.sign b/qwen3-4b-log-unary/model_layers_10_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..4c1c3ba8e7b2a46207fda14fee30ae6ccdcca904 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_10_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ca17d942e5fe0922c42a914bc9a64dcc0ebb7a4a18b4ef229b45b29e20a946d +size 3112960 diff --git a/qwen3-4b-log-unary/model_layers_11_mlp_up_proj_weight.planes b/qwen3-4b-log-unary/model_layers_11_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..365a90130f39775c5ab8b1e7d65d6219dbe875c9 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_11_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9f2641a115600c763dc86f868df8ba89c9c604306df3c67318395072c67c35a +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_12_mlp_down_proj_weight.planes b/qwen3-4b-log-unary/model_layers_12_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..e5a2ef6e8bf7d96c8baed50b26c0293f3312e2e8 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_12_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3ff2091c8dd9911ad615b9a967b81f7d36b057995fa519967400d68a6f4b2a4 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_12_self_attn_o_proj_weight.planes b/qwen3-4b-log-unary/model_layers_12_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..fd04f2adcdec64a958824c787b107b41a9ea533d --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_12_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a19a2e0866b66ecee574b2233ce0a8040ab32c11c2bbdf3146233793ea973926 +size 5242880 diff --git a/qwen3-4b-log-unary/model_layers_13_mlp_down_proj_weight.planes b/qwen3-4b-log-unary/model_layers_13_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..f07fe843d9789408827f4ce789ada8efe12078fe --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_13_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c6f1afb8a07bdbebf2f37fbd516a1a8c39212bd551f7546952f7123a94512a2 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_13_self_attn_v_proj_weight.sign b/qwen3-4b-log-unary/model_layers_13_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..2565dccb52636bfc05dbad12cb78228f6c7776ac --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_13_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef22657af38dfa55a6643d10d05f17bc07e7dd22dffb441335d241f43012735d +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_14_self_attn_o_proj_weight.sign b/qwen3-4b-log-unary/model_layers_14_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..2bb813e284025f5b9c4d43de29b6446c8e7139a7 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_14_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be8872f5c3b18235d642feab7ef48883727e22b4e3a4a54d812b6a6d913b9f7 +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_14_self_attn_v_proj_weight.planes b/qwen3-4b-log-unary/model_layers_14_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..3800d77b37519956216ac06d379b340e130b1a87 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_14_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4961c31739ac7f2e449e9d91ddef9dee0b6cc83e249d1aec1317862df056d5ad +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_15_self_attn_k_proj_weight.sign b/qwen3-4b-log-unary/model_layers_15_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..10f9f78d89536f0f883bae5b23b9abf65d168cb7 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_15_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:100255bd7f8cf5dc54287f7b0035163521f93e2733db43a8ec4393dbc11bf847 +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_16_mlp_gate_proj_weight.planes b/qwen3-4b-log-unary/model_layers_16_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..48c626b78e46d67dd40a5d7d084709567aa33ffa --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_16_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6265e4381e7bc7d4e2e654d7f224ae3908964ef539decc45341d808a0d058a3d +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_16_self_attn_k_proj_weight.sign b/qwen3-4b-log-unary/model_layers_16_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ee781b701fc4e95f620cd3aaf95666095f4e22b9 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_16_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd6c26ba0abbb345403f7aee428b24d0d7953d96cd51297f9d6f291eaa82280 +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_18_mlp_down_proj_weight.planes b/qwen3-4b-log-unary/model_layers_18_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..a674cb2b95d916e869a55569b2cc0317c5024ddc --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_18_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:831dff145e99a8ab46f3aa2c36c89e9698f971291681ab426ddca683d5d369cc +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_18_mlp_down_proj_weight.sign b/qwen3-4b-log-unary/model_layers_18_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f67831d61713594b1977798de8d2e05629fbec56 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_18_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:191aab29a883acc5bebc9aaa662625ba6fd13bcbee37e450059bbcdd6b1eb64f +size 3112960 diff --git a/qwen3-4b-log-unary/model_layers_18_self_attn_k_proj_weight.sign b/qwen3-4b-log-unary/model_layers_18_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..0e1fd7cbc475deb8faf291acd90a2ff12cc23ba2 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_18_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0814e0957837478c9bff2ef5a07ee7e580d2f5675b5fa9fd345b8b07147042f +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_19_self_attn_q_proj_weight.sign b/qwen3-4b-log-unary/model_layers_19_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..7b87322ba53b24ddd53dee5193423acd266063bc --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_19_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0173e82b0140a65e1168f2caf6b75b06e12e1fa26cdfc25c5371b3fd90cd69e5 +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_1_mlp_gate_proj_weight.planes b/qwen3-4b-log-unary/model_layers_1_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..e786851989b0d8acfa6582cdc608c6615e23707a --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_1_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1950c4893f26b628a517bcad2fe850c84b8e363f1ae69636021448b7c92c27c +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_1_mlp_gate_proj_weight.sign b/qwen3-4b-log-unary/model_layers_1_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..4e29f0360db120309b7d5262d253a2b4ce71c9e7 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_1_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a20be68c85d530c6dcb0940e3c0fffcb478f4196f634c9553eb53920c66147dd +size 3112960 diff --git a/qwen3-4b-log-unary/model_layers_1_mlp_up_proj_weight.planes b/qwen3-4b-log-unary/model_layers_1_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0b9007dc8cf6d2fb04c1304e3f3f8e6313400e42 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_1_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17198c1c69416665626281074b56abc7b22ffdbba6d8a87cf9bd7f548527759d +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_1_self_attn_v_proj_weight.planes b/qwen3-4b-log-unary/model_layers_1_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c4a6b7de23b8c499fed7e5d25d26be06d19d7e5b --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_1_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4e8ec0a25b4961c162f3dd9b7d334c3b575f53274e9335f661bc8be6314bfe3 +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_20_mlp_gate_proj_weight.sign b/qwen3-4b-log-unary/model_layers_20_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..98d0edab8e286b1d1b8aedefd99250d516637658 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_20_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f99b1d5a74e9ac3fa3043eeef11504dc3394ce4dfc998143c295fa0ad2f617b3 +size 3112960 diff --git a/qwen3-4b-log-unary/model_layers_20_self_attn_k_proj_weight.sign b/qwen3-4b-log-unary/model_layers_20_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d9246134185f4698ef0918f92ccacb72a3249e0c --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_20_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b59dca26592161ef5d9070645f0695b6fe1cc5906b242d9fcf652c1b5e0052d +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_21_mlp_gate_proj_weight.sign b/qwen3-4b-log-unary/model_layers_21_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3037cf2a7aa341517d296390eeab37d2fddf6691 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_21_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9bbf908f91410afdd4d3c3eff4c3f91667767de757f7d63dfa2c26bbe83097c +size 3112960 diff --git a/qwen3-4b-log-unary/model_layers_21_self_attn_o_proj_weight.planes b/qwen3-4b-log-unary/model_layers_21_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..289d9a91138b163662a7b3fd5bb050bd9d59290b --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_21_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82120adbd75ee1d2c5bddb0103731cebec09bc35e36b774cad7b352902fe2638 +size 5242880 diff --git a/qwen3-4b-log-unary/model_layers_22_mlp_down_proj_weight.planes b/qwen3-4b-log-unary/model_layers_22_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2247b221b42aaeebe075c585e784ed52a8e2ef82 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_22_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8de6de72036f0bc258349223fc5f4343960adaee078368fce4060b98de31b52 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_22_self_attn_k_proj_weight.sign b/qwen3-4b-log-unary/model_layers_22_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..d050a2545020361e9cca8058d4136faa0754a6e4 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_22_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55cc75ff7f3426037950e875ddbf69df634fbda22c7c5c01e24b9c09f37bd5de +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_23_mlp_gate_proj_weight.planes b/qwen3-4b-log-unary/model_layers_23_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..ba0283a88d934c92f36e4409334a8ef145d26a93 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_23_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c48599c82add73110884a259da694c46792501add3d0f9e2b23a1f5bba55320 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_23_mlp_up_proj_weight.planes b/qwen3-4b-log-unary/model_layers_23_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2afac44cc24dbfa0ab9f4921073dbe48c45ea191 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_23_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0122501c5e545dd57a6403e4ddd9efd9b88f3451d80b634a2b4e7780acfb4f25 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_23_self_attn_k_proj_weight.planes b/qwen3-4b-log-unary/model_layers_23_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..5c9ee1efcd1eeac03004a7ea86614fb6793474cf --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_23_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:826675deefa641a96d11afcac4fcb24b1519c66d7d343c03e059265c72e19e32 +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_23_self_attn_o_proj_weight.planes b/qwen3-4b-log-unary/model_layers_23_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..fe5ff8e86068a0e9acad84425d0c466a49dc1585 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_23_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae7912cfaf9ccddc51e1678f9b256f4055d2e8b7c83b337fc93b1e500b81d6e4 +size 5242880 diff --git a/qwen3-4b-log-unary/model_layers_23_self_attn_q_proj_weight.sign b/qwen3-4b-log-unary/model_layers_23_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a23754efa2d8a8b2f06362044b23594556f52f1b --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_23_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a362881ac91375acf3d900b6d5d9fc9f6408cd5fa7e7428eec8cd05f4037256e +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_25_self_attn_o_proj_weight.sign b/qwen3-4b-log-unary/model_layers_25_self_attn_o_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..366d68f47612aca1fd3b85b012e4c497ae7ab944 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_25_self_attn_o_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0b9f9b0a8748b9f34b8d2dfccff7ed3fc179a387fe6da714620e013a7208af7 +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_25_self_attn_q_proj_weight.planes b/qwen3-4b-log-unary/model_layers_25_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8cae56bc512e375bdb9cc1204c102e9d403d4c9b --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_25_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:401a270a554f5c73e44993294dea0b7403fa6a0013ea5348822b36976e7bb3b7 +size 5242880 diff --git a/qwen3-4b-log-unary/model_layers_26_self_attn_k_proj_weight.sign b/qwen3-4b-log-unary/model_layers_26_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..41e0f865d29fba32fe203737dd2dae15115e5791 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_26_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d99330bd1b21e2339e558bb52411cf27b4159f31d058affa1b7d59df594185 +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_26_self_attn_q_proj_weight.planes b/qwen3-4b-log-unary/model_layers_26_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..201c0425341e2b4406c66dd0cc2a9dcfb1cd5d7a --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_26_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba60c7b999dddbe08f1593b57216df55072d7fc17be6201da8dd84307c6fd31b +size 5242880 diff --git a/qwen3-4b-log-unary/model_layers_26_self_attn_v_proj_weight.sign b/qwen3-4b-log-unary/model_layers_26_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f2fdf3974d5d72374b7ec268cf8e65777f5d0a1f --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_26_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0ffa8954fb39b2ebe7507d1476e88d0f9f5e6de727da3a3d3ef013963176f51 +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_28_self_attn_k_proj_weight.planes b/qwen3-4b-log-unary/model_layers_28_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..8720aeea22b48c4d8816badd56afb1b702fb5935 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_28_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93ba6afc01924044c8b9972a8ee0337686480899a7b351644c15befcc83f91bb +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_28_self_attn_v_proj_weight.planes b/qwen3-4b-log-unary/model_layers_28_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..1bf80948a5853c7dc2fcbf5972cf210ea3daca9b --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_28_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdd148b50c77fdb020447549911117e46dbbaef3c12dc410516226558b62f4ca +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_29_mlp_gate_proj_weight.sign b/qwen3-4b-log-unary/model_layers_29_mlp_gate_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..ac7a4dc2bab443cfb7b84995e84ede381cb3a501 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_29_mlp_gate_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00af432f4f613219c7a3c967f12fa1aa5f3fc420bc28f13044538b4d54dfb16f +size 3112960 diff --git a/qwen3-4b-log-unary/model_layers_29_self_attn_k_proj_weight.sign b/qwen3-4b-log-unary/model_layers_29_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..f732bd19ef3cec667e48fadc93687bbca19869d4 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_29_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bbf973d1150f3c86c3cfbdf58568415f16bbb82dae77c220b87ea69b31fb46e +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_2_mlp_down_proj_weight.planes b/qwen3-4b-log-unary/model_layers_2_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..19b519a14fa525c2c7cf0043e131435d2db87cf9 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_2_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0db77accc8606e4e431bd6fea2b2e88872366ef9f492cf1631fea524fce29d6 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_30_mlp_up_proj_weight.planes b/qwen3-4b-log-unary/model_layers_30_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..c7f073f853c6cbc9e4b560abe784c71348e9edcf --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_30_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa67c80ae31e101bebf428501e31bf3fd6eb415e36def3e5360ca9db4d5f0623 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_30_self_attn_k_proj_weight.sign b/qwen3-4b-log-unary/model_layers_30_self_attn_k_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..781de41037372127a14559b34ccb9b8d4b9074d7 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_30_self_attn_k_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:553707edea3c89f6ae36f110fcf87624f7426705f5f9ab92d3bffb2f3a3c59de +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_30_self_attn_q_proj_weight.planes b/qwen3-4b-log-unary/model_layers_30_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..676a8879888b4b995337f5ce4e23f235eba4f9a5 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_30_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e888d4031f4c177bab055cafd10a3f935343443b47d767c17d96ee8ea0137cf +size 5242880 diff --git a/qwen3-4b-log-unary/model_layers_30_self_attn_q_proj_weight.sign b/qwen3-4b-log-unary/model_layers_30_self_attn_q_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..75c290cde05238d0e1ce3cd54818de0a31859743 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_30_self_attn_q_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b6e658659017b404e3ebfae35ac74a8425c30c861c362737edb528316c44a75 +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_31_mlp_down_proj_weight.planes b/qwen3-4b-log-unary/model_layers_31_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..11067ac669b4814b7530a1143aaaa521f1798578 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_31_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eca51222f0664a3cf2c3e2f790d7bc5e21df65a644d09bb0f4a1a75990fca4e +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_31_self_attn_v_proj_weight.sign b/qwen3-4b-log-unary/model_layers_31_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..bfe2a14e77d93536aa6963c8c26af92cb2ff471a --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_31_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3614dc1465f91eb22d0c1ed3370504612ec658a4579589f21e7b083fc658ecfd +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_32_mlp_up_proj_weight.planes b/qwen3-4b-log-unary/model_layers_32_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..7d157dd856b5f35fc072bcec25731ee3b0ed8e5d --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_32_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:968e1faecb3bf5b7df481facc46db7b1bdad628b9acfd64e998696117fc6ccc8 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_32_self_attn_k_proj_weight.planes b/qwen3-4b-log-unary/model_layers_32_self_attn_k_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..93ac9b1dc9e9901dffca2b9a8c4056e4e851d3e4 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_32_self_attn_k_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0e19c01bf82f7d765987bf47ac551d3293b76792af3accc6c158d986ff8e3a7 +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_32_self_attn_v_proj_weight.planes b/qwen3-4b-log-unary/model_layers_32_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..dc91e82e35feb51a8ee3a7d167b12526b64a94b1 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_32_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ede63d12d4839ec0002e298ffb379a398db47cdff2558ce3cfff3b19c2e5d42 +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_33_self_attn_v_proj_weight.planes b/qwen3-4b-log-unary/model_layers_33_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..4127ed2a3e7ccad576132f4098b79bda01399c9f --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_33_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02fff19c06c0fcd96d59b2084916a4b51e4495e75dbad17f142beb7725d7329a +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_34_mlp_down_proj_weight.sign b/qwen3-4b-log-unary/model_layers_34_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..5d799081e08fd53f2f2d75e36e17c73efd40cb4e --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_34_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9138e09e71c789f2bc52a28f3dc893d638b79a2e079b915a8a8ff1ec863ea0ae +size 3112960 diff --git a/qwen3-4b-log-unary/model_layers_35_mlp_down_proj_weight.sign b/qwen3-4b-log-unary/model_layers_35_mlp_down_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..a89362920ce71ee8965b66c9280d603a19a4592c --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_35_mlp_down_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84fce60705fa4bd02603437fd94790ea5f874701376c4fb2498fc80b993c0c1e +size 3112960 diff --git a/qwen3-4b-log-unary/model_layers_35_self_attn_q_proj_weight.planes b/qwen3-4b-log-unary/model_layers_35_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..69aa9af27490dbd4816e70167e54a6a1785cdd53 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_35_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73d3305a01ce95b70add8f070aca112e7afba486427f5269998d2d0fa02688b +size 5242880 diff --git a/qwen3-4b-log-unary/model_layers_3_self_attn_o_proj_weight.planes b/qwen3-4b-log-unary/model_layers_3_self_attn_o_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..56e4ae31ef063908ab015850bc4d3e709c94bed8 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_3_self_attn_o_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fccfeed9afc3a7b16d41eee282e085e50827939b29e5a070c84445146d372212 +size 5242880 diff --git a/qwen3-4b-log-unary/model_layers_3_self_attn_q_proj_weight.planes b/qwen3-4b-log-unary/model_layers_3_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..097d7a1e6a63165906c7a11d4be5d8aeaa0140ad --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_3_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce56d4717616e3d444ba59a94abfb0ec17d898b1533779cbc319b56379dca705 +size 5242880 diff --git a/qwen3-4b-log-unary/model_layers_6_mlp_gate_proj_weight.planes b/qwen3-4b-log-unary/model_layers_6_mlp_gate_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..d5d6080e8958c2c8324a0b221724a925cb665b03 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_6_mlp_gate_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df9cc645a84a0d2cb2f4a16411bbae08a22d96e7ce14c1d7b5da46429f46a9f9 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_6_self_attn_v_proj_weight.planes b/qwen3-4b-log-unary/model_layers_6_self_attn_v_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..632234efbe41cb8b4905eb6089a903fb8ae7f075 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_6_self_attn_v_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:572c4600852f5f839ad20b8443f99e55fc1ed41fc7cf6934e211dd1b2e3f3fa9 +size 1310720 diff --git a/qwen3-4b-log-unary/model_layers_7_mlp_up_proj_weight.planes b/qwen3-4b-log-unary/model_layers_7_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..3d8c3ab39c023c8f6844132f6c2fc70f688d7215 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_7_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c8b0002db1c9bec9805242085784630b83cf99a0aa29ad8065e8b305ad52444 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_7_mlp_up_proj_weight.sign b/qwen3-4b-log-unary/model_layers_7_mlp_up_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..3bbab39592e55820dedc3d383b22c0778147163d --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_7_mlp_up_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:677419e3e94fe6bac9a712546763b783fe94890c2adde79f7f1e38b9ba414826 +size 3112960 diff --git a/qwen3-4b-log-unary/model_layers_7_self_attn_v_proj_weight.sign b/qwen3-4b-log-unary/model_layers_7_self_attn_v_proj_weight.sign new file mode 100644 index 0000000000000000000000000000000000000000..2bde8e7a1c0dc5786a59f7e1f8389ba80d58c9c7 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_7_self_attn_v_proj_weight.sign @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7ce53e084a36861f15af93bb6085b9843861265e2e815078809e2686010c74 +size 327680 diff --git a/qwen3-4b-log-unary/model_layers_8_mlp_down_proj_weight.planes b/qwen3-4b-log-unary/model_layers_8_mlp_down_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..2bbb6871683e8b4aedb6df34b2d3336f703875cd --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_8_mlp_down_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e3e88dca7b599488a362e37d2bc509b5aa9274fbc488e312d55d8fe855ad94 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_9_mlp_up_proj_weight.planes b/qwen3-4b-log-unary/model_layers_9_mlp_up_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..0fffc0899e5030bb1e40f58afb73f6b68fbcf878 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_9_mlp_up_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f02c32701a8bcd6112c1d44cc0f581212398d92be18364439ba1565129f0044 +size 12451840 diff --git a/qwen3-4b-log-unary/model_layers_9_self_attn_q_proj_weight.planes b/qwen3-4b-log-unary/model_layers_9_self_attn_q_proj_weight.planes new file mode 100644 index 0000000000000000000000000000000000000000..834dfdb72dde73c2159c85ea543d7d761a5ea2c9 --- /dev/null +++ b/qwen3-4b-log-unary/model_layers_9_self_attn_q_proj_weight.planes @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a8403b19c3ad47c06ec6ff362ae8b794f0e0bc6c53fb163c14835ec79e65d0 +size 5242880 diff --git a/qwen3-4b-thinking-hf/model-00001-of-00003.safetensors b/qwen3-4b-thinking-hf/model-00001-of-00003.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9283db5ecbec606c21c3948b577df8b845934f3d --- /dev/null +++ b/qwen3-4b-thinking-hf/model-00001-of-00003.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98178c1cddbca8ad76102afdbf76e4df79b64b82377ad4dca34c755cac00571a +size 3957900840 diff --git a/qwen3-4b-thinking-hf/model-00002-of-00003.safetensors b/qwen3-4b-thinking-hf/model-00002-of-00003.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a789e04cb3865d37334314d148e02bf18ffff780 --- /dev/null +++ b/qwen3-4b-thinking-hf/model-00002-of-00003.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57b5bd1f667d420350f169342a90b50e5ffc2aa202ba1819da1af3367ff2261f +size 3987450520 diff --git a/qwen3-4b-thinking-unary/model_layers_13_input_layernorm_weight.fp16 b/qwen3-4b-thinking-unary/model_layers_13_input_layernorm_weight.fp16 new file mode 100644 index 0000000000000000000000000000000000000000..3d9eab9bef0050afccb6912b293ac2ea05c0617f Binary files /dev/null and b/qwen3-4b-thinking-unary/model_layers_13_input_layernorm_weight.fp16 differ diff --git a/qwen3-4b-thinking-unary/model_layers_20_self_attn_q_proj_weight.scales b/qwen3-4b-thinking-unary/model_layers_20_self_attn_q_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..7ec6f2f265bf974f305be83d087cb87638640304 Binary files /dev/null and b/qwen3-4b-thinking-unary/model_layers_20_self_attn_q_proj_weight.scales differ diff --git a/qwen3-4b-thinking-unary/model_layers_2_mlp_down_proj_weight.scales b/qwen3-4b-thinking-unary/model_layers_2_mlp_down_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..ca73e44ad18d64719007ff891df9bb196483ea1c Binary files /dev/null and b/qwen3-4b-thinking-unary/model_layers_2_mlp_down_proj_weight.scales differ diff --git a/qwen3-4b-thinking-unary/model_layers_4_self_attn_q_proj_weight.scales b/qwen3-4b-thinking-unary/model_layers_4_self_attn_q_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..6a69c051c04c9ac0c02a6d911e284663828258f7 Binary files /dev/null and b/qwen3-4b-thinking-unary/model_layers_4_self_attn_q_proj_weight.scales differ diff --git a/qwen3-4b-thinking-unary/model_layers_8_mlp_gate_proj_weight.scales b/qwen3-4b-thinking-unary/model_layers_8_mlp_gate_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..2f0eeb436c44103b62f24d93bf25797454cf2b92 Binary files /dev/null and b/qwen3-4b-thinking-unary/model_layers_8_mlp_gate_proj_weight.scales differ diff --git a/qwen3-4b-thinking-unary/model_layers_9_self_attn_q_proj_weight.scales b/qwen3-4b-thinking-unary/model_layers_9_self_attn_q_proj_weight.scales new file mode 100644 index 0000000000000000000000000000000000000000..aed372ea175426b6c0856b06cc3711f29fe91e1d Binary files /dev/null and b/qwen3-4b-thinking-unary/model_layers_9_self_attn_q_proj_weight.scales differ