| -- model.embed_tokens rfn_err: 0.000000 max_diff/norm: 0.000000 sqnr: 79.869484 cos_err: 0.000000 | |
| -- model.layers.0 rfn_err: 0.000543 max_diff/norm: 0.000184 sqnr: 68.177185 cos_err: 0.000000 | |
| -- model.layers.1 rfn_err: 0.001513 max_diff/norm: 0.000866 sqnr: 65.447161 cos_err: 0.000001 | |
| -- model.layers.2 rfn_err: 0.003429 max_diff/norm: 0.002247 sqnr: 59.905907 cos_err: 0.000004 | |
| -- model.layers.3 rfn_err: 0.004892 max_diff/norm: 0.002883 sqnr: 55.291200 cos_err: 0.000008 | |
| -- model.layers.4 rfn_err: 0.005726 max_diff/norm: 0.003310 sqnr: 52.228319 cos_err: 0.000011 | |
| -- model.layers.5 rfn_err: 0.008686 max_diff/norm: 0.188249 sqnr: 49.429878 cos_err: 0.000017 | |
| -- model.layers.6 rfn_err: 0.009091 max_diff/norm: 0.187352 sqnr: 47.501211 cos_err: 0.000025 | |
| -- model.layers.7 rfn_err: 0.009506 max_diff/norm: 0.182608 sqnr: 45.382496 cos_err: 0.000034 | |
| -- model.layers.8 rfn_err: 0.010246 max_diff/norm: 0.180253 sqnr: 43.051331 cos_err: 0.000053 | |
| -- model.layers.9 rfn_err: 0.010918 max_diff/norm: 0.177052 sqnr: 41.321413 cos_err: 0.000071 | |
| -- model.layers.10 rfn_err: 0.011519 max_diff/norm: 0.174697 sqnr: 40.338670 cos_err: 0.000086 | |
| -- model.layers.11 rfn_err: 0.012264 max_diff/norm: 0.172930 sqnr: 39.208071 cos_err: 0.000108 | |
| -- model.layers.12 rfn_err: 0.013085 max_diff/norm: 0.171060 sqnr: 38.091909 cos_err: 0.000132 | |
| -- model.layers.13 rfn_err: 0.013903 max_diff/norm: 0.169636 sqnr: 37.261419 cos_err: 0.000158 | |
| -- model.layers.14 rfn_err: 0.014629 max_diff/norm: 0.168219 sqnr: 36.583158 cos_err: 0.000180 | |
| -- model.layers.15 rfn_err: 0.015628 max_diff/norm: 0.166202 sqnr: 35.780368 cos_err: 0.000212 | |
| -- model.layers.16 rfn_err: 0.016242 max_diff/norm: 0.163085 sqnr: 35.441346 cos_err: 0.000228 | |
| -- model.layers.17 rfn_err: 0.017188 max_diff/norm: 0.161503 sqnr: 34.837762 cos_err: 0.000263 | |
| -- model.layers.18 rfn_err: 0.018460 max_diff/norm: 0.160362 sqnr: 34.086316 cos_err: 0.000316 | |
| -- model.layers.19 rfn_err: 0.019807 max_diff/norm: 0.158439 sqnr: 33.417090 cos_err: 0.000372 | |
| -- model.layers.20 rfn_err: 0.021275 max_diff/norm: 0.156205 sqnr: 32.797049 cos_err: 0.000434 | |
| -- model.layers.21 rfn_err: 0.022793 max_diff/norm: 0.154088 sqnr: 32.250618 cos_err: 0.000510 | |
| -- model.layers.22 rfn_err: 0.025017 max_diff/norm: 0.151355 sqnr: 31.522344 cos_err: 0.000629 | |
| -- model.layers.23 rfn_err: 0.027571 max_diff/norm: 0.149713 sqnr: 30.720477 cos_err: 0.000811 | |
| -- model.layers.24 rfn_err: 0.030635 max_diff/norm: 0.143742 sqnr: 29.978750 cos_err: 0.001035 | |
| -- model.layers.25 rfn_err: 0.035260 max_diff/norm: 0.142449 sqnr: 28.921009 cos_err: 0.001450 | |
| -- model.layers.26 rfn_err: 0.041012 max_diff/norm: 0.142144 sqnr: 27.738527 cos_err: 0.001992 | |
| -- model.layers.27 rfn_err: 0.048649 max_diff/norm: 0.140497 sqnr: 26.724511 cos_err: 0.002842 | |
| -- model.layers.28 rfn_err: 0.075249 max_diff/norm: 0.138490 sqnr: 25.626220 cos_err: 0.004184 | |
| -- model.layers.29 rfn_err: 0.085114 max_diff/norm: 0.137145 sqnr: 24.873034 cos_err: 0.005033 | |
| -- model.layers.30 rfn_err: 0.093850 max_diff/norm: 0.133826 sqnr: 23.763328 cos_err: 0.006293 | |
| -- model.layers.31 rfn_err: 0.099443 max_diff/norm: 0.131075 sqnr: 23.143857 cos_err: 0.007078 | |
| -- model.layers.32 rfn_err: 0.110217 max_diff/norm: 0.127145 sqnr: 22.407360 cos_err: 0.007872 | |
| -- model.layers.33 rfn_err: 0.115368 max_diff/norm: 0.124526 sqnr: 21.812169 cos_err: 0.009041 | |
| -- model.layers.34 rfn_err: 0.118347 max_diff/norm: 0.120848 sqnr: 21.452885 cos_err: 0.009680 | |
| -- model.layers.35 rfn_err: 0.121983 max_diff/norm: 0.117505 sqnr: 21.180904 cos_err: 0.010409 | |
| -- model.layers.36 rfn_err: 0.129488 max_diff/norm: 0.115913 sqnr: 20.568714 cos_err: 0.011940 | |
| -- model.layers.37 rfn_err: 0.130546 max_diff/norm: 0.110626 sqnr: 20.523469 cos_err: 0.012070 | |
| -- model.layers.38 rfn_err: 0.134762 max_diff/norm: 0.107698 sqnr: 20.258577 cos_err: 0.013730 | |
| -- model.layers.39 rfn_err: 0.136458 max_diff/norm: 0.102443 sqnr: 20.352471 cos_err: 0.013488 | |
| -- model.layers.40 rfn_err: 0.138824 max_diff/norm: 0.099604 sqnr: 20.215974 cos_err: 0.013448 | |
| -- model.layers.41 rfn_err: 0.142556 max_diff/norm: 0.093639 sqnr: 20.129098 cos_err: 0.014499 | |
| -- model.layers.42 rfn_err: 0.147585 max_diff/norm: 0.089614 sqnr: 19.955028 cos_err: 0.015680 | |
| -- model.layers.43 rfn_err: 0.149174 max_diff/norm: 0.083302 sqnr: 20.070309 cos_err: 0.014730 | |
| -- model.layers.44 rfn_err: 0.155522 max_diff/norm: 0.079138 sqnr: 19.834189 cos_err: 0.015953 | |
| -- model.layers.45 rfn_err: 0.159260 max_diff/norm: 0.076222 sqnr: 19.685693 cos_err: 0.016491 | |
| -- model.layers.46 rfn_err: 0.159097 max_diff/norm: 0.071667 sqnr: 19.735605 cos_err: 0.016122 | |
| -- model.layers.47 rfn_err: 0.164939 max_diff/norm: 0.067849 sqnr: 19.584990 cos_err: 0.017165 | |
| -- model.layers.48 rfn_err: 0.165954 max_diff/norm: 0.064549 sqnr: 19.534291 cos_err: 0.017085 | |
| -- model.layers.49 rfn_err: 0.167305 max_diff/norm: 0.060484 sqnr: 19.525616 cos_err: 0.017809 | |
| -- model.layers.50 rfn_err: 0.168045 max_diff/norm: 0.057157 sqnr: 19.455932 cos_err: 0.018103 | |
| -- model.layers.51 rfn_err: 0.171497 max_diff/norm: 0.053969 sqnr: 19.336356 cos_err: 0.018967 | |
| -- model.layers.52 rfn_err: 0.171437 max_diff/norm: 0.050450 sqnr: 19.299448 cos_err: 0.019189 | |
| -- model.layers.53 rfn_err: 0.171026 max_diff/norm: 0.047735 sqnr: 19.203575 cos_err: 0.019697 | |
| -- model.layers.54 rfn_err: 0.170891 max_diff/norm: 0.045281 sqnr: 19.107354 cos_err: 0.019586 | |
| -- model.layers.55 rfn_err: 0.173012 max_diff/norm: 0.043646 sqnr: 18.910681 cos_err: 0.020545 | |
| -- model.layers.56 rfn_err: 0.172990 max_diff/norm: 0.041733 sqnr: 18.769338 cos_err: 0.020506 | |
| -- model.layers.57 rfn_err: 0.169792 max_diff/norm: 0.038496 sqnr: 18.663130 cos_err: 0.019758 | |
| -- model.layers.58 rfn_err: 0.161728 max_diff/norm: 0.036592 sqnr: 18.628091 cos_err: 0.017834 | |
| -- model.layers.59 rfn_err: 0.154931 max_diff/norm: 0.034570 sqnr: 18.614537 cos_err: 0.015379 | |
| -- model.layers.60 rfn_err: 0.146969 max_diff/norm: 0.030656 sqnr: 18.880935 cos_err: 0.012806 | |
| -- model.layers.61 rfn_err: 0.138028 max_diff/norm: 0.047421 sqnr: 19.416316 cos_err: 0.012273 | |
| -- model.norm rfn_err: 0.158195 max_diff/norm: 0.006963 sqnr: 19.225764 cos_err: 0.013913 | |
| -- A perplexity: 8.35782554 | |
| -- B perplexity: 8.34981264 | |
| -- A label in top-K: | |
| K = 1: 0.5596 | |
| K = 2: 0.6798 | |
| K = 3: 0.7387 | |
| K = 4: 0.7746 | |
| K = 5: 0.7998 | |
| -- B label in top-K: | |
| K = 1: 0.5598 | |
| K = 2: 0.6804 | |
| K = 3: 0.7390 | |
| K = 4: 0.7749 | |
| K = 5: 0.8005 | |
| -- Top-K agreement, A vs B: | |
| K = 1: 0.9449 | |
| K = 2: 0.8209 | |
| K = 3: 0.6651 | |
| K = 4: 0.5071 | |
| K = 5: 0.3670 | |
| -- KL divergence (A, B): 0.04015230 | |
| -- KL divergence (B, A): 0.04071388 | |