llm-course

Форк
0
/
Quantize_models_with_ExLlamaV2.ipynb 
8505 строк · 512.7 Кб
1
{
2
  "nbformat": 4,
3
  "nbformat_minor": 0,
4
  "metadata": {
5
    "colab": {
6
      "provenance": [],
7
      "gpuType": "T4",
8
      "authorship_tag": "ABX9TyMkzVB0crkJL3VvXFtgSkwZ",
9
      "include_colab_link": true
10
    },
11
    "kernelspec": {
12
      "name": "python3",
13
      "display_name": "Python 3"
14
    },
15
    "language_info": {
16
      "name": "python"
17
    },
18
    "accelerator": "GPU",
19
    "widgets": {
20
      "application/vnd.jupyter.widget-state+json": {
21
        "da62083d1a3d4d62b76a92abec717a24": {
22
          "model_module": "@jupyter-widgets/controls",
23
          "model_name": "VBoxModel",
24
          "model_module_version": "1.5.0",
25
          "state": {
26
            "_dom_classes": [],
27
            "_model_module": "@jupyter-widgets/controls",
28
            "_model_module_version": "1.5.0",
29
            "_model_name": "VBoxModel",
30
            "_view_count": null,
31
            "_view_module": "@jupyter-widgets/controls",
32
            "_view_module_version": "1.5.0",
33
            "_view_name": "VBoxView",
34
            "box_style": "",
35
            "children": [
36
              "IPY_MODEL_12051bdac0aa466c91122f3cb0e1ab2b",
37
              "IPY_MODEL_e9569646ef72451496087c49a2487ddc",
38
              "IPY_MODEL_23fc55e87153404d90f55930f7f73988",
39
              "IPY_MODEL_903957b2c1404703b2e59a2875da77ec"
40
            ],
41
            "layout": "IPY_MODEL_05c1e6ba7977465092a69324888cf59e"
42
          }
43
        },
44
        "9109e78e934040a7a4fedc9e9a2b5751": {
45
          "model_module": "@jupyter-widgets/controls",
46
          "model_name": "HTMLModel",
47
          "model_module_version": "1.5.0",
48
          "state": {
49
            "_dom_classes": [],
50
            "_model_module": "@jupyter-widgets/controls",
51
            "_model_module_version": "1.5.0",
52
            "_model_name": "HTMLModel",
53
            "_view_count": null,
54
            "_view_module": "@jupyter-widgets/controls",
55
            "_view_module_version": "1.5.0",
56
            "_view_name": "HTMLView",
57
            "description": "",
58
            "description_tooltip": null,
59
            "layout": "IPY_MODEL_26073e1c5d284656be9c5fdb55276a25",
60
            "placeholder": "​",
61
            "style": "IPY_MODEL_51b1646d7e194c75b1109d16b8291c76",
62
            "value": "<center> <img\nsrc=https://huggingface.co/front/assets/huggingface_logo-noborder.svg\nalt='Hugging Face'> <br> Copy a token from <a\nhref=\"https://huggingface.co/settings/tokens\" target=\"_blank\">your Hugging Face\ntokens page</a> and paste it below. <br> Immediately click login after copying\nyour token or it might be stored in plain text in this notebook file. </center>"
63
          }
64
        },
65
        "e2bf96c3e5e946f5a832f3d5bcf86202": {
66
          "model_module": "@jupyter-widgets/controls",
67
          "model_name": "PasswordModel",
68
          "model_module_version": "1.5.0",
69
          "state": {
70
            "_dom_classes": [],
71
            "_model_module": "@jupyter-widgets/controls",
72
            "_model_module_version": "1.5.0",
73
            "_model_name": "PasswordModel",
74
            "_view_count": null,
75
            "_view_module": "@jupyter-widgets/controls",
76
            "_view_module_version": "1.5.0",
77
            "_view_name": "PasswordView",
78
            "continuous_update": true,
79
            "description": "Token:",
80
            "description_tooltip": null,
81
            "disabled": false,
82
            "layout": "IPY_MODEL_3efa5c88dc2d491c99678d73e4144eeb",
83
            "placeholder": "​",
84
            "style": "IPY_MODEL_b1dfa66aec6a4e86bff78e3a62905a3c",
85
            "value": ""
86
          }
87
        },
88
        "d83804efc2c34b628cda200bb40fa8db": {
89
          "model_module": "@jupyter-widgets/controls",
90
          "model_name": "CheckboxModel",
91
          "model_module_version": "1.5.0",
92
          "state": {
93
            "_dom_classes": [],
94
            "_model_module": "@jupyter-widgets/controls",
95
            "_model_module_version": "1.5.0",
96
            "_model_name": "CheckboxModel",
97
            "_view_count": null,
98
            "_view_module": "@jupyter-widgets/controls",
99
            "_view_module_version": "1.5.0",
100
            "_view_name": "CheckboxView",
101
            "description": "Add token as git credential?",
102
            "description_tooltip": null,
103
            "disabled": false,
104
            "indent": true,
105
            "layout": "IPY_MODEL_5e4cc08b7aa44cacae18fcc4131c174d",
106
            "style": "IPY_MODEL_813d16aa8a144cf7b3c1b08d096a2b20",
107
            "value": true
108
          }
109
        },
110
        "401d9fb01f054e6aaaf62b1546ab7686": {
111
          "model_module": "@jupyter-widgets/controls",
112
          "model_name": "ButtonModel",
113
          "model_module_version": "1.5.0",
114
          "state": {
115
            "_dom_classes": [],
116
            "_model_module": "@jupyter-widgets/controls",
117
            "_model_module_version": "1.5.0",
118
            "_model_name": "ButtonModel",
119
            "_view_count": null,
120
            "_view_module": "@jupyter-widgets/controls",
121
            "_view_module_version": "1.5.0",
122
            "_view_name": "ButtonView",
123
            "button_style": "",
124
            "description": "Login",
125
            "disabled": false,
126
            "icon": "",
127
            "layout": "IPY_MODEL_63c15146f75f473394ebcc165ca0d7f6",
128
            "style": "IPY_MODEL_cc10d97351604ee18918afa1d955a089",
129
            "tooltip": ""
130
          }
131
        },
132
        "9f6d67cf6b9748288044a8c7a98cc2e3": {
133
          "model_module": "@jupyter-widgets/controls",
134
          "model_name": "HTMLModel",
135
          "model_module_version": "1.5.0",
136
          "state": {
137
            "_dom_classes": [],
138
            "_model_module": "@jupyter-widgets/controls",
139
            "_model_module_version": "1.5.0",
140
            "_model_name": "HTMLModel",
141
            "_view_count": null,
142
            "_view_module": "@jupyter-widgets/controls",
143
            "_view_module_version": "1.5.0",
144
            "_view_name": "HTMLView",
145
            "description": "",
146
            "description_tooltip": null,
147
            "layout": "IPY_MODEL_6ff94a654ed54915b2082197920e89ab",
148
            "placeholder": "​",
149
            "style": "IPY_MODEL_dc9118ad41d247cab135811a183805e8",
150
            "value": "\n<b>Pro Tip:</b> If you don't already have one, you can create a dedicated\n'notebooks' token with 'write' access, that you can then easily reuse for all\nnotebooks. </center>"
151
          }
152
        },
153
        "05c1e6ba7977465092a69324888cf59e": {
154
          "model_module": "@jupyter-widgets/base",
155
          "model_name": "LayoutModel",
156
          "model_module_version": "1.2.0",
157
          "state": {
158
            "_model_module": "@jupyter-widgets/base",
159
            "_model_module_version": "1.2.0",
160
            "_model_name": "LayoutModel",
161
            "_view_count": null,
162
            "_view_module": "@jupyter-widgets/base",
163
            "_view_module_version": "1.2.0",
164
            "_view_name": "LayoutView",
165
            "align_content": null,
166
            "align_items": "center",
167
            "align_self": null,
168
            "border": null,
169
            "bottom": null,
170
            "display": "flex",
171
            "flex": null,
172
            "flex_flow": "column",
173
            "grid_area": null,
174
            "grid_auto_columns": null,
175
            "grid_auto_flow": null,
176
            "grid_auto_rows": null,
177
            "grid_column": null,
178
            "grid_gap": null,
179
            "grid_row": null,
180
            "grid_template_areas": null,
181
            "grid_template_columns": null,
182
            "grid_template_rows": null,
183
            "height": null,
184
            "justify_content": null,
185
            "justify_items": null,
186
            "left": null,
187
            "margin": null,
188
            "max_height": null,
189
            "max_width": null,
190
            "min_height": null,
191
            "min_width": null,
192
            "object_fit": null,
193
            "object_position": null,
194
            "order": null,
195
            "overflow": null,
196
            "overflow_x": null,
197
            "overflow_y": null,
198
            "padding": null,
199
            "right": null,
200
            "top": null,
201
            "visibility": null,
202
            "width": "50%"
203
          }
204
        },
205
        "26073e1c5d284656be9c5fdb55276a25": {
206
          "model_module": "@jupyter-widgets/base",
207
          "model_name": "LayoutModel",
208
          "model_module_version": "1.2.0",
209
          "state": {
210
            "_model_module": "@jupyter-widgets/base",
211
            "_model_module_version": "1.2.0",
212
            "_model_name": "LayoutModel",
213
            "_view_count": null,
214
            "_view_module": "@jupyter-widgets/base",
215
            "_view_module_version": "1.2.0",
216
            "_view_name": "LayoutView",
217
            "align_content": null,
218
            "align_items": null,
219
            "align_self": null,
220
            "border": null,
221
            "bottom": null,
222
            "display": null,
223
            "flex": null,
224
            "flex_flow": null,
225
            "grid_area": null,
226
            "grid_auto_columns": null,
227
            "grid_auto_flow": null,
228
            "grid_auto_rows": null,
229
            "grid_column": null,
230
            "grid_gap": null,
231
            "grid_row": null,
232
            "grid_template_areas": null,
233
            "grid_template_columns": null,
234
            "grid_template_rows": null,
235
            "height": null,
236
            "justify_content": null,
237
            "justify_items": null,
238
            "left": null,
239
            "margin": null,
240
            "max_height": null,
241
            "max_width": null,
242
            "min_height": null,
243
            "min_width": null,
244
            "object_fit": null,
245
            "object_position": null,
246
            "order": null,
247
            "overflow": null,
248
            "overflow_x": null,
249
            "overflow_y": null,
250
            "padding": null,
251
            "right": null,
252
            "top": null,
253
            "visibility": null,
254
            "width": null
255
          }
256
        },
257
        "51b1646d7e194c75b1109d16b8291c76": {
258
          "model_module": "@jupyter-widgets/controls",
259
          "model_name": "DescriptionStyleModel",
260
          "model_module_version": "1.5.0",
261
          "state": {
262
            "_model_module": "@jupyter-widgets/controls",
263
            "_model_module_version": "1.5.0",
264
            "_model_name": "DescriptionStyleModel",
265
            "_view_count": null,
266
            "_view_module": "@jupyter-widgets/base",
267
            "_view_module_version": "1.2.0",
268
            "_view_name": "StyleView",
269
            "description_width": ""
270
          }
271
        },
272
        "3efa5c88dc2d491c99678d73e4144eeb": {
273
          "model_module": "@jupyter-widgets/base",
274
          "model_name": "LayoutModel",
275
          "model_module_version": "1.2.0",
276
          "state": {
277
            "_model_module": "@jupyter-widgets/base",
278
            "_model_module_version": "1.2.0",
279
            "_model_name": "LayoutModel",
280
            "_view_count": null,
281
            "_view_module": "@jupyter-widgets/base",
282
            "_view_module_version": "1.2.0",
283
            "_view_name": "LayoutView",
284
            "align_content": null,
285
            "align_items": null,
286
            "align_self": null,
287
            "border": null,
288
            "bottom": null,
289
            "display": null,
290
            "flex": null,
291
            "flex_flow": null,
292
            "grid_area": null,
293
            "grid_auto_columns": null,
294
            "grid_auto_flow": null,
295
            "grid_auto_rows": null,
296
            "grid_column": null,
297
            "grid_gap": null,
298
            "grid_row": null,
299
            "grid_template_areas": null,
300
            "grid_template_columns": null,
301
            "grid_template_rows": null,
302
            "height": null,
303
            "justify_content": null,
304
            "justify_items": null,
305
            "left": null,
306
            "margin": null,
307
            "max_height": null,
308
            "max_width": null,
309
            "min_height": null,
310
            "min_width": null,
311
            "object_fit": null,
312
            "object_position": null,
313
            "order": null,
314
            "overflow": null,
315
            "overflow_x": null,
316
            "overflow_y": null,
317
            "padding": null,
318
            "right": null,
319
            "top": null,
320
            "visibility": null,
321
            "width": null
322
          }
323
        },
324
        "b1dfa66aec6a4e86bff78e3a62905a3c": {
325
          "model_module": "@jupyter-widgets/controls",
326
          "model_name": "DescriptionStyleModel",
327
          "model_module_version": "1.5.0",
328
          "state": {
329
            "_model_module": "@jupyter-widgets/controls",
330
            "_model_module_version": "1.5.0",
331
            "_model_name": "DescriptionStyleModel",
332
            "_view_count": null,
333
            "_view_module": "@jupyter-widgets/base",
334
            "_view_module_version": "1.2.0",
335
            "_view_name": "StyleView",
336
            "description_width": ""
337
          }
338
        },
339
        "5e4cc08b7aa44cacae18fcc4131c174d": {
340
          "model_module": "@jupyter-widgets/base",
341
          "model_name": "LayoutModel",
342
          "model_module_version": "1.2.0",
343
          "state": {
344
            "_model_module": "@jupyter-widgets/base",
345
            "_model_module_version": "1.2.0",
346
            "_model_name": "LayoutModel",
347
            "_view_count": null,
348
            "_view_module": "@jupyter-widgets/base",
349
            "_view_module_version": "1.2.0",
350
            "_view_name": "LayoutView",
351
            "align_content": null,
352
            "align_items": null,
353
            "align_self": null,
354
            "border": null,
355
            "bottom": null,
356
            "display": null,
357
            "flex": null,
358
            "flex_flow": null,
359
            "grid_area": null,
360
            "grid_auto_columns": null,
361
            "grid_auto_flow": null,
362
            "grid_auto_rows": null,
363
            "grid_column": null,
364
            "grid_gap": null,
365
            "grid_row": null,
366
            "grid_template_areas": null,
367
            "grid_template_columns": null,
368
            "grid_template_rows": null,
369
            "height": null,
370
            "justify_content": null,
371
            "justify_items": null,
372
            "left": null,
373
            "margin": null,
374
            "max_height": null,
375
            "max_width": null,
376
            "min_height": null,
377
            "min_width": null,
378
            "object_fit": null,
379
            "object_position": null,
380
            "order": null,
381
            "overflow": null,
382
            "overflow_x": null,
383
            "overflow_y": null,
384
            "padding": null,
385
            "right": null,
386
            "top": null,
387
            "visibility": null,
388
            "width": null
389
          }
390
        },
391
        "813d16aa8a144cf7b3c1b08d096a2b20": {
392
          "model_module": "@jupyter-widgets/controls",
393
          "model_name": "DescriptionStyleModel",
394
          "model_module_version": "1.5.0",
395
          "state": {
396
            "_model_module": "@jupyter-widgets/controls",
397
            "_model_module_version": "1.5.0",
398
            "_model_name": "DescriptionStyleModel",
399
            "_view_count": null,
400
            "_view_module": "@jupyter-widgets/base",
401
            "_view_module_version": "1.2.0",
402
            "_view_name": "StyleView",
403
            "description_width": ""
404
          }
405
        },
406
        "63c15146f75f473394ebcc165ca0d7f6": {
407
          "model_module": "@jupyter-widgets/base",
408
          "model_name": "LayoutModel",
409
          "model_module_version": "1.2.0",
410
          "state": {
411
            "_model_module": "@jupyter-widgets/base",
412
            "_model_module_version": "1.2.0",
413
            "_model_name": "LayoutModel",
414
            "_view_count": null,
415
            "_view_module": "@jupyter-widgets/base",
416
            "_view_module_version": "1.2.0",
417
            "_view_name": "LayoutView",
418
            "align_content": null,
419
            "align_items": null,
420
            "align_self": null,
421
            "border": null,
422
            "bottom": null,
423
            "display": null,
424
            "flex": null,
425
            "flex_flow": null,
426
            "grid_area": null,
427
            "grid_auto_columns": null,
428
            "grid_auto_flow": null,
429
            "grid_auto_rows": null,
430
            "grid_column": null,
431
            "grid_gap": null,
432
            "grid_row": null,
433
            "grid_template_areas": null,
434
            "grid_template_columns": null,
435
            "grid_template_rows": null,
436
            "height": null,
437
            "justify_content": null,
438
            "justify_items": null,
439
            "left": null,
440
            "margin": null,
441
            "max_height": null,
442
            "max_width": null,
443
            "min_height": null,
444
            "min_width": null,
445
            "object_fit": null,
446
            "object_position": null,
447
            "order": null,
448
            "overflow": null,
449
            "overflow_x": null,
450
            "overflow_y": null,
451
            "padding": null,
452
            "right": null,
453
            "top": null,
454
            "visibility": null,
455
            "width": null
456
          }
457
        },
458
        "cc10d97351604ee18918afa1d955a089": {
459
          "model_module": "@jupyter-widgets/controls",
460
          "model_name": "ButtonStyleModel",
461
          "model_module_version": "1.5.0",
462
          "state": {
463
            "_model_module": "@jupyter-widgets/controls",
464
            "_model_module_version": "1.5.0",
465
            "_model_name": "ButtonStyleModel",
466
            "_view_count": null,
467
            "_view_module": "@jupyter-widgets/base",
468
            "_view_module_version": "1.2.0",
469
            "_view_name": "StyleView",
470
            "button_color": null,
471
            "font_weight": ""
472
          }
473
        },
474
        "6ff94a654ed54915b2082197920e89ab": {
475
          "model_module": "@jupyter-widgets/base",
476
          "model_name": "LayoutModel",
477
          "model_module_version": "1.2.0",
478
          "state": {
479
            "_model_module": "@jupyter-widgets/base",
480
            "_model_module_version": "1.2.0",
481
            "_model_name": "LayoutModel",
482
            "_view_count": null,
483
            "_view_module": "@jupyter-widgets/base",
484
            "_view_module_version": "1.2.0",
485
            "_view_name": "LayoutView",
486
            "align_content": null,
487
            "align_items": null,
488
            "align_self": null,
489
            "border": null,
490
            "bottom": null,
491
            "display": null,
492
            "flex": null,
493
            "flex_flow": null,
494
            "grid_area": null,
495
            "grid_auto_columns": null,
496
            "grid_auto_flow": null,
497
            "grid_auto_rows": null,
498
            "grid_column": null,
499
            "grid_gap": null,
500
            "grid_row": null,
501
            "grid_template_areas": null,
502
            "grid_template_columns": null,
503
            "grid_template_rows": null,
504
            "height": null,
505
            "justify_content": null,
506
            "justify_items": null,
507
            "left": null,
508
            "margin": null,
509
            "max_height": null,
510
            "max_width": null,
511
            "min_height": null,
512
            "min_width": null,
513
            "object_fit": null,
514
            "object_position": null,
515
            "order": null,
516
            "overflow": null,
517
            "overflow_x": null,
518
            "overflow_y": null,
519
            "padding": null,
520
            "right": null,
521
            "top": null,
522
            "visibility": null,
523
            "width": null
524
          }
525
        },
526
        "dc9118ad41d247cab135811a183805e8": {
527
          "model_module": "@jupyter-widgets/controls",
528
          "model_name": "DescriptionStyleModel",
529
          "model_module_version": "1.5.0",
530
          "state": {
531
            "_model_module": "@jupyter-widgets/controls",
532
            "_model_module_version": "1.5.0",
533
            "_model_name": "DescriptionStyleModel",
534
            "_view_count": null,
535
            "_view_module": "@jupyter-widgets/base",
536
            "_view_module_version": "1.2.0",
537
            "_view_name": "StyleView",
538
            "description_width": ""
539
          }
540
        },
541
        "3e285ebb0b7d414fb5ab6ee02ccb4f50": {
542
          "model_module": "@jupyter-widgets/controls",
543
          "model_name": "LabelModel",
544
          "model_module_version": "1.5.0",
545
          "state": {
546
            "_dom_classes": [],
547
            "_model_module": "@jupyter-widgets/controls",
548
            "_model_module_version": "1.5.0",
549
            "_model_name": "LabelModel",
550
            "_view_count": null,
551
            "_view_module": "@jupyter-widgets/controls",
552
            "_view_module_version": "1.5.0",
553
            "_view_name": "LabelView",
554
            "description": "",
555
            "description_tooltip": null,
556
            "layout": "IPY_MODEL_ae75d86eb24241d082669a422df4180c",
557
            "placeholder": "​",
558
            "style": "IPY_MODEL_f8e648aa342c43aa9e960622f897e5c5",
559
            "value": "Connecting..."
560
          }
561
        },
562
        "ae75d86eb24241d082669a422df4180c": {
563
          "model_module": "@jupyter-widgets/base",
564
          "model_name": "LayoutModel",
565
          "model_module_version": "1.2.0",
566
          "state": {
567
            "_model_module": "@jupyter-widgets/base",
568
            "_model_module_version": "1.2.0",
569
            "_model_name": "LayoutModel",
570
            "_view_count": null,
571
            "_view_module": "@jupyter-widgets/base",
572
            "_view_module_version": "1.2.0",
573
            "_view_name": "LayoutView",
574
            "align_content": null,
575
            "align_items": null,
576
            "align_self": null,
577
            "border": null,
578
            "bottom": null,
579
            "display": null,
580
            "flex": null,
581
            "flex_flow": null,
582
            "grid_area": null,
583
            "grid_auto_columns": null,
584
            "grid_auto_flow": null,
585
            "grid_auto_rows": null,
586
            "grid_column": null,
587
            "grid_gap": null,
588
            "grid_row": null,
589
            "grid_template_areas": null,
590
            "grid_template_columns": null,
591
            "grid_template_rows": null,
592
            "height": null,
593
            "justify_content": null,
594
            "justify_items": null,
595
            "left": null,
596
            "margin": null,
597
            "max_height": null,
598
            "max_width": null,
599
            "min_height": null,
600
            "min_width": null,
601
            "object_fit": null,
602
            "object_position": null,
603
            "order": null,
604
            "overflow": null,
605
            "overflow_x": null,
606
            "overflow_y": null,
607
            "padding": null,
608
            "right": null,
609
            "top": null,
610
            "visibility": null,
611
            "width": null
612
          }
613
        },
614
        "f8e648aa342c43aa9e960622f897e5c5": {
615
          "model_module": "@jupyter-widgets/controls",
616
          "model_name": "DescriptionStyleModel",
617
          "model_module_version": "1.5.0",
618
          "state": {
619
            "_model_module": "@jupyter-widgets/controls",
620
            "_model_module_version": "1.5.0",
621
            "_model_name": "DescriptionStyleModel",
622
            "_view_count": null,
623
            "_view_module": "@jupyter-widgets/base",
624
            "_view_module_version": "1.2.0",
625
            "_view_name": "StyleView",
626
            "description_width": ""
627
          }
628
        },
629
        "12051bdac0aa466c91122f3cb0e1ab2b": {
630
          "model_module": "@jupyter-widgets/controls",
631
          "model_name": "LabelModel",
632
          "model_module_version": "1.5.0",
633
          "state": {
634
            "_dom_classes": [],
635
            "_model_module": "@jupyter-widgets/controls",
636
            "_model_module_version": "1.5.0",
637
            "_model_name": "LabelModel",
638
            "_view_count": null,
639
            "_view_module": "@jupyter-widgets/controls",
640
            "_view_module_version": "1.5.0",
641
            "_view_name": "LabelView",
642
            "description": "",
643
            "description_tooltip": null,
644
            "layout": "IPY_MODEL_cfbb97be5d284781b35abeca297bbad9",
645
            "placeholder": "​",
646
            "style": "IPY_MODEL_ab04ee5ca65f45fc9368a80847926198",
647
            "value": "Token is valid (permission: write)."
648
          }
649
        },
650
        "e9569646ef72451496087c49a2487ddc": {
651
          "model_module": "@jupyter-widgets/controls",
652
          "model_name": "LabelModel",
653
          "model_module_version": "1.5.0",
654
          "state": {
655
            "_dom_classes": [],
656
            "_model_module": "@jupyter-widgets/controls",
657
            "_model_module_version": "1.5.0",
658
            "_model_name": "LabelModel",
659
            "_view_count": null,
660
            "_view_module": "@jupyter-widgets/controls",
661
            "_view_module_version": "1.5.0",
662
            "_view_name": "LabelView",
663
            "description": "",
664
            "description_tooltip": null,
665
            "layout": "IPY_MODEL_0fd23d208e5942439a7e83797ac9fe64",
666
            "placeholder": "​",
667
            "style": "IPY_MODEL_e1da3e30982746959ec7ebd180a3bbb9",
668
            "value": "Your token has been saved in your configured git credential helpers (store)."
669
          }
670
        },
671
        "23fc55e87153404d90f55930f7f73988": {
672
          "model_module": "@jupyter-widgets/controls",
673
          "model_name": "LabelModel",
674
          "model_module_version": "1.5.0",
675
          "state": {
676
            "_dom_classes": [],
677
            "_model_module": "@jupyter-widgets/controls",
678
            "_model_module_version": "1.5.0",
679
            "_model_name": "LabelModel",
680
            "_view_count": null,
681
            "_view_module": "@jupyter-widgets/controls",
682
            "_view_module_version": "1.5.0",
683
            "_view_name": "LabelView",
684
            "description": "",
685
            "description_tooltip": null,
686
            "layout": "IPY_MODEL_0836d18df07244afb40d2cc2f6a3879e",
687
            "placeholder": "​",
688
            "style": "IPY_MODEL_79189477733f4aff8e62c4cbf318e91b",
689
            "value": "Your token has been saved to /root/.cache/huggingface/token"
690
          }
691
        },
692
        "903957b2c1404703b2e59a2875da77ec": {
693
          "model_module": "@jupyter-widgets/controls",
694
          "model_name": "LabelModel",
695
          "model_module_version": "1.5.0",
696
          "state": {
697
            "_dom_classes": [],
698
            "_model_module": "@jupyter-widgets/controls",
699
            "_model_module_version": "1.5.0",
700
            "_model_name": "LabelModel",
701
            "_view_count": null,
702
            "_view_module": "@jupyter-widgets/controls",
703
            "_view_module_version": "1.5.0",
704
            "_view_name": "LabelView",
705
            "description": "",
706
            "description_tooltip": null,
707
            "layout": "IPY_MODEL_4a4d70a7a8dd4af4b3147161193b1885",
708
            "placeholder": "​",
709
            "style": "IPY_MODEL_b72edebfa2a548b49c47bad5bc7aeecd",
710
            "value": "Login successful"
711
          }
712
        },
713
        "cfbb97be5d284781b35abeca297bbad9": {
714
          "model_module": "@jupyter-widgets/base",
715
          "model_name": "LayoutModel",
716
          "model_module_version": "1.2.0",
717
          "state": {
718
            "_model_module": "@jupyter-widgets/base",
719
            "_model_module_version": "1.2.0",
720
            "_model_name": "LayoutModel",
721
            "_view_count": null,
722
            "_view_module": "@jupyter-widgets/base",
723
            "_view_module_version": "1.2.0",
724
            "_view_name": "LayoutView",
725
            "align_content": null,
726
            "align_items": null,
727
            "align_self": null,
728
            "border": null,
729
            "bottom": null,
730
            "display": null,
731
            "flex": null,
732
            "flex_flow": null,
733
            "grid_area": null,
734
            "grid_auto_columns": null,
735
            "grid_auto_flow": null,
736
            "grid_auto_rows": null,
737
            "grid_column": null,
738
            "grid_gap": null,
739
            "grid_row": null,
740
            "grid_template_areas": null,
741
            "grid_template_columns": null,
742
            "grid_template_rows": null,
743
            "height": null,
744
            "justify_content": null,
745
            "justify_items": null,
746
            "left": null,
747
            "margin": null,
748
            "max_height": null,
749
            "max_width": null,
750
            "min_height": null,
751
            "min_width": null,
752
            "object_fit": null,
753
            "object_position": null,
754
            "order": null,
755
            "overflow": null,
756
            "overflow_x": null,
757
            "overflow_y": null,
758
            "padding": null,
759
            "right": null,
760
            "top": null,
761
            "visibility": null,
762
            "width": null
763
          }
764
        },
765
        "ab04ee5ca65f45fc9368a80847926198": {
766
          "model_module": "@jupyter-widgets/controls",
767
          "model_name": "DescriptionStyleModel",
768
          "model_module_version": "1.5.0",
769
          "state": {
770
            "_model_module": "@jupyter-widgets/controls",
771
            "_model_module_version": "1.5.0",
772
            "_model_name": "DescriptionStyleModel",
773
            "_view_count": null,
774
            "_view_module": "@jupyter-widgets/base",
775
            "_view_module_version": "1.2.0",
776
            "_view_name": "StyleView",
777
            "description_width": ""
778
          }
779
        },
780
        "0fd23d208e5942439a7e83797ac9fe64": {
781
          "model_module": "@jupyter-widgets/base",
782
          "model_name": "LayoutModel",
783
          "model_module_version": "1.2.0",
784
          "state": {
785
            "_model_module": "@jupyter-widgets/base",
786
            "_model_module_version": "1.2.0",
787
            "_model_name": "LayoutModel",
788
            "_view_count": null,
789
            "_view_module": "@jupyter-widgets/base",
790
            "_view_module_version": "1.2.0",
791
            "_view_name": "LayoutView",
792
            "align_content": null,
793
            "align_items": null,
794
            "align_self": null,
795
            "border": null,
796
            "bottom": null,
797
            "display": null,
798
            "flex": null,
799
            "flex_flow": null,
800
            "grid_area": null,
801
            "grid_auto_columns": null,
802
            "grid_auto_flow": null,
803
            "grid_auto_rows": null,
804
            "grid_column": null,
805
            "grid_gap": null,
806
            "grid_row": null,
807
            "grid_template_areas": null,
808
            "grid_template_columns": null,
809
            "grid_template_rows": null,
810
            "height": null,
811
            "justify_content": null,
812
            "justify_items": null,
813
            "left": null,
814
            "margin": null,
815
            "max_height": null,
816
            "max_width": null,
817
            "min_height": null,
818
            "min_width": null,
819
            "object_fit": null,
820
            "object_position": null,
821
            "order": null,
822
            "overflow": null,
823
            "overflow_x": null,
824
            "overflow_y": null,
825
            "padding": null,
826
            "right": null,
827
            "top": null,
828
            "visibility": null,
829
            "width": null
830
          }
831
        },
832
        "e1da3e30982746959ec7ebd180a3bbb9": {
833
          "model_module": "@jupyter-widgets/controls",
834
          "model_name": "DescriptionStyleModel",
835
          "model_module_version": "1.5.0",
836
          "state": {
837
            "_model_module": "@jupyter-widgets/controls",
838
            "_model_module_version": "1.5.0",
839
            "_model_name": "DescriptionStyleModel",
840
            "_view_count": null,
841
            "_view_module": "@jupyter-widgets/base",
842
            "_view_module_version": "1.2.0",
843
            "_view_name": "StyleView",
844
            "description_width": ""
845
          }
846
        },
847
        "0836d18df07244afb40d2cc2f6a3879e": {
848
          "model_module": "@jupyter-widgets/base",
849
          "model_name": "LayoutModel",
850
          "model_module_version": "1.2.0",
851
          "state": {
852
            "_model_module": "@jupyter-widgets/base",
853
            "_model_module_version": "1.2.0",
854
            "_model_name": "LayoutModel",
855
            "_view_count": null,
856
            "_view_module": "@jupyter-widgets/base",
857
            "_view_module_version": "1.2.0",
858
            "_view_name": "LayoutView",
859
            "align_content": null,
860
            "align_items": null,
861
            "align_self": null,
862
            "border": null,
863
            "bottom": null,
864
            "display": null,
865
            "flex": null,
866
            "flex_flow": null,
867
            "grid_area": null,
868
            "grid_auto_columns": null,
869
            "grid_auto_flow": null,
870
            "grid_auto_rows": null,
871
            "grid_column": null,
872
            "grid_gap": null,
873
            "grid_row": null,
874
            "grid_template_areas": null,
875
            "grid_template_columns": null,
876
            "grid_template_rows": null,
877
            "height": null,
878
            "justify_content": null,
879
            "justify_items": null,
880
            "left": null,
881
            "margin": null,
882
            "max_height": null,
883
            "max_width": null,
884
            "min_height": null,
885
            "min_width": null,
886
            "object_fit": null,
887
            "object_position": null,
888
            "order": null,
889
            "overflow": null,
890
            "overflow_x": null,
891
            "overflow_y": null,
892
            "padding": null,
893
            "right": null,
894
            "top": null,
895
            "visibility": null,
896
            "width": null
897
          }
898
        },
899
        "79189477733f4aff8e62c4cbf318e91b": {
900
          "model_module": "@jupyter-widgets/controls",
901
          "model_name": "DescriptionStyleModel",
902
          "model_module_version": "1.5.0",
903
          "state": {
904
            "_model_module": "@jupyter-widgets/controls",
905
            "_model_module_version": "1.5.0",
906
            "_model_name": "DescriptionStyleModel",
907
            "_view_count": null,
908
            "_view_module": "@jupyter-widgets/base",
909
            "_view_module_version": "1.2.0",
910
            "_view_name": "StyleView",
911
            "description_width": ""
912
          }
913
        },
914
        "4a4d70a7a8dd4af4b3147161193b1885": {
915
          "model_module": "@jupyter-widgets/base",
916
          "model_name": "LayoutModel",
917
          "model_module_version": "1.2.0",
918
          "state": {
919
            "_model_module": "@jupyter-widgets/base",
920
            "_model_module_version": "1.2.0",
921
            "_model_name": "LayoutModel",
922
            "_view_count": null,
923
            "_view_module": "@jupyter-widgets/base",
924
            "_view_module_version": "1.2.0",
925
            "_view_name": "LayoutView",
926
            "align_content": null,
927
            "align_items": null,
928
            "align_self": null,
929
            "border": null,
930
            "bottom": null,
931
            "display": null,
932
            "flex": null,
933
            "flex_flow": null,
934
            "grid_area": null,
935
            "grid_auto_columns": null,
936
            "grid_auto_flow": null,
937
            "grid_auto_rows": null,
938
            "grid_column": null,
939
            "grid_gap": null,
940
            "grid_row": null,
941
            "grid_template_areas": null,
942
            "grid_template_columns": null,
943
            "grid_template_rows": null,
944
            "height": null,
945
            "justify_content": null,
946
            "justify_items": null,
947
            "left": null,
948
            "margin": null,
949
            "max_height": null,
950
            "max_width": null,
951
            "min_height": null,
952
            "min_width": null,
953
            "object_fit": null,
954
            "object_position": null,
955
            "order": null,
956
            "overflow": null,
957
            "overflow_x": null,
958
            "overflow_y": null,
959
            "padding": null,
960
            "right": null,
961
            "top": null,
962
            "visibility": null,
963
            "width": null
964
          }
965
        },
966
        "b72edebfa2a548b49c47bad5bc7aeecd": {
967
          "model_module": "@jupyter-widgets/controls",
968
          "model_name": "DescriptionStyleModel",
969
          "model_module_version": "1.5.0",
970
          "state": {
971
            "_model_module": "@jupyter-widgets/controls",
972
            "_model_module_version": "1.5.0",
973
            "_model_name": "DescriptionStyleModel",
974
            "_view_count": null,
975
            "_view_module": "@jupyter-widgets/base",
976
            "_view_module_version": "1.2.0",
977
            "_view_name": "StyleView",
978
            "description_width": ""
979
          }
980
        },
981
        "98916f7a1809458e8ebc568f770ed544": {
982
          "model_module": "@jupyter-widgets/controls",
983
          "model_name": "HBoxModel",
984
          "model_module_version": "1.5.0",
985
          "state": {
986
            "_dom_classes": [],
987
            "_model_module": "@jupyter-widgets/controls",
988
            "_model_module_version": "1.5.0",
989
            "_model_name": "HBoxModel",
990
            "_view_count": null,
991
            "_view_module": "@jupyter-widgets/controls",
992
            "_view_module_version": "1.5.0",
993
            "_view_name": "HBoxView",
994
            "box_style": "",
995
            "children": [
996
              "IPY_MODEL_2c6ba20e4b384d6fa46fbd832daf36e2",
997
              "IPY_MODEL_a6920b63b1cb4c1297bc5a18c7e30f7e",
998
              "IPY_MODEL_c18e0920993f4189ab927b167fb9a046"
999
            ],
1000
            "layout": "IPY_MODEL_13565f1b6e6e4fa7a365160dad1cdb42"
1001
          }
1002
        },
1003
        "2c6ba20e4b384d6fa46fbd832daf36e2": {
1004
          "model_module": "@jupyter-widgets/controls",
1005
          "model_name": "HTMLModel",
1006
          "model_module_version": "1.5.0",
1007
          "state": {
1008
            "_dom_classes": [],
1009
            "_model_module": "@jupyter-widgets/controls",
1010
            "_model_module_version": "1.5.0",
1011
            "_model_name": "HTMLModel",
1012
            "_view_count": null,
1013
            "_view_module": "@jupyter-widgets/controls",
1014
            "_view_module_version": "1.5.0",
1015
            "_view_name": "HTMLView",
1016
            "description": "",
1017
            "description_tooltip": null,
1018
            "layout": "IPY_MODEL_fa3308e0b8fb469d8549199e8bfe2278",
1019
            "placeholder": "​",
1020
            "style": "IPY_MODEL_e7672f0406bd4f2c8a0ef83fd390e49d",
1021
            "value": "cal_data.safetensors: 100%"
1022
          }
1023
        },
1024
        "a6920b63b1cb4c1297bc5a18c7e30f7e": {
1025
          "model_module": "@jupyter-widgets/controls",
1026
          "model_name": "FloatProgressModel",
1027
          "model_module_version": "1.5.0",
1028
          "state": {
1029
            "_dom_classes": [],
1030
            "_model_module": "@jupyter-widgets/controls",
1031
            "_model_module_version": "1.5.0",
1032
            "_model_name": "FloatProgressModel",
1033
            "_view_count": null,
1034
            "_view_module": "@jupyter-widgets/controls",
1035
            "_view_module_version": "1.5.0",
1036
            "_view_name": "ProgressView",
1037
            "bar_style": "success",
1038
            "description": "",
1039
            "description_tooltip": null,
1040
            "layout": "IPY_MODEL_22b9c33a7c084ccd9e8878bda3748486",
1041
            "max": 1638488,
1042
            "min": 0,
1043
            "orientation": "horizontal",
1044
            "style": "IPY_MODEL_2d6aa1ecdf7444b4b4cb81515d3654be",
1045
            "value": 1638488
1046
          }
1047
        },
1048
        "c18e0920993f4189ab927b167fb9a046": {
1049
          "model_module": "@jupyter-widgets/controls",
1050
          "model_name": "HTMLModel",
1051
          "model_module_version": "1.5.0",
1052
          "state": {
1053
            "_dom_classes": [],
1054
            "_model_module": "@jupyter-widgets/controls",
1055
            "_model_module_version": "1.5.0",
1056
            "_model_name": "HTMLModel",
1057
            "_view_count": null,
1058
            "_view_module": "@jupyter-widgets/controls",
1059
            "_view_module_version": "1.5.0",
1060
            "_view_name": "HTMLView",
1061
            "description": "",
1062
            "description_tooltip": null,
1063
            "layout": "IPY_MODEL_6cedbad90ca9423f85a48d7e4073a378",
1064
            "placeholder": "​",
1065
            "style": "IPY_MODEL_c893eb5da4e34e4999981b3810a4205b",
1066
            "value": " 1.64M/1.64M [00:01&lt;00:00, 22.1kB/s]"
1067
          }
1068
        },
1069
        "13565f1b6e6e4fa7a365160dad1cdb42": {
1070
          "model_module": "@jupyter-widgets/base",
1071
          "model_name": "LayoutModel",
1072
          "model_module_version": "1.2.0",
1073
          "state": {
1074
            "_model_module": "@jupyter-widgets/base",
1075
            "_model_module_version": "1.2.0",
1076
            "_model_name": "LayoutModel",
1077
            "_view_count": null,
1078
            "_view_module": "@jupyter-widgets/base",
1079
            "_view_module_version": "1.2.0",
1080
            "_view_name": "LayoutView",
1081
            "align_content": null,
1082
            "align_items": null,
1083
            "align_self": null,
1084
            "border": null,
1085
            "bottom": null,
1086
            "display": null,
1087
            "flex": null,
1088
            "flex_flow": null,
1089
            "grid_area": null,
1090
            "grid_auto_columns": null,
1091
            "grid_auto_flow": null,
1092
            "grid_auto_rows": null,
1093
            "grid_column": null,
1094
            "grid_gap": null,
1095
            "grid_row": null,
1096
            "grid_template_areas": null,
1097
            "grid_template_columns": null,
1098
            "grid_template_rows": null,
1099
            "height": null,
1100
            "justify_content": null,
1101
            "justify_items": null,
1102
            "left": null,
1103
            "margin": null,
1104
            "max_height": null,
1105
            "max_width": null,
1106
            "min_height": null,
1107
            "min_width": null,
1108
            "object_fit": null,
1109
            "object_position": null,
1110
            "order": null,
1111
            "overflow": null,
1112
            "overflow_x": null,
1113
            "overflow_y": null,
1114
            "padding": null,
1115
            "right": null,
1116
            "top": null,
1117
            "visibility": null,
1118
            "width": null
1119
          }
1120
        },
1121
        "fa3308e0b8fb469d8549199e8bfe2278": {
1122
          "model_module": "@jupyter-widgets/base",
1123
          "model_name": "LayoutModel",
1124
          "model_module_version": "1.2.0",
1125
          "state": {
1126
            "_model_module": "@jupyter-widgets/base",
1127
            "_model_module_version": "1.2.0",
1128
            "_model_name": "LayoutModel",
1129
            "_view_count": null,
1130
            "_view_module": "@jupyter-widgets/base",
1131
            "_view_module_version": "1.2.0",
1132
            "_view_name": "LayoutView",
1133
            "align_content": null,
1134
            "align_items": null,
1135
            "align_self": null,
1136
            "border": null,
1137
            "bottom": null,
1138
            "display": null,
1139
            "flex": null,
1140
            "flex_flow": null,
1141
            "grid_area": null,
1142
            "grid_auto_columns": null,
1143
            "grid_auto_flow": null,
1144
            "grid_auto_rows": null,
1145
            "grid_column": null,
1146
            "grid_gap": null,
1147
            "grid_row": null,
1148
            "grid_template_areas": null,
1149
            "grid_template_columns": null,
1150
            "grid_template_rows": null,
1151
            "height": null,
1152
            "justify_content": null,
1153
            "justify_items": null,
1154
            "left": null,
1155
            "margin": null,
1156
            "max_height": null,
1157
            "max_width": null,
1158
            "min_height": null,
1159
            "min_width": null,
1160
            "object_fit": null,
1161
            "object_position": null,
1162
            "order": null,
1163
            "overflow": null,
1164
            "overflow_x": null,
1165
            "overflow_y": null,
1166
            "padding": null,
1167
            "right": null,
1168
            "top": null,
1169
            "visibility": null,
1170
            "width": null
1171
          }
1172
        },
1173
        "e7672f0406bd4f2c8a0ef83fd390e49d": {
1174
          "model_module": "@jupyter-widgets/controls",
1175
          "model_name": "DescriptionStyleModel",
1176
          "model_module_version": "1.5.0",
1177
          "state": {
1178
            "_model_module": "@jupyter-widgets/controls",
1179
            "_model_module_version": "1.5.0",
1180
            "_model_name": "DescriptionStyleModel",
1181
            "_view_count": null,
1182
            "_view_module": "@jupyter-widgets/base",
1183
            "_view_module_version": "1.2.0",
1184
            "_view_name": "StyleView",
1185
            "description_width": ""
1186
          }
1187
        },
1188
        "22b9c33a7c084ccd9e8878bda3748486": {
1189
          "model_module": "@jupyter-widgets/base",
1190
          "model_name": "LayoutModel",
1191
          "model_module_version": "1.2.0",
1192
          "state": {
1193
            "_model_module": "@jupyter-widgets/base",
1194
            "_model_module_version": "1.2.0",
1195
            "_model_name": "LayoutModel",
1196
            "_view_count": null,
1197
            "_view_module": "@jupyter-widgets/base",
1198
            "_view_module_version": "1.2.0",
1199
            "_view_name": "LayoutView",
1200
            "align_content": null,
1201
            "align_items": null,
1202
            "align_self": null,
1203
            "border": null,
1204
            "bottom": null,
1205
            "display": null,
1206
            "flex": null,
1207
            "flex_flow": null,
1208
            "grid_area": null,
1209
            "grid_auto_columns": null,
1210
            "grid_auto_flow": null,
1211
            "grid_auto_rows": null,
1212
            "grid_column": null,
1213
            "grid_gap": null,
1214
            "grid_row": null,
1215
            "grid_template_areas": null,
1216
            "grid_template_columns": null,
1217
            "grid_template_rows": null,
1218
            "height": null,
1219
            "justify_content": null,
1220
            "justify_items": null,
1221
            "left": null,
1222
            "margin": null,
1223
            "max_height": null,
1224
            "max_width": null,
1225
            "min_height": null,
1226
            "min_width": null,
1227
            "object_fit": null,
1228
            "object_position": null,
1229
            "order": null,
1230
            "overflow": null,
1231
            "overflow_x": null,
1232
            "overflow_y": null,
1233
            "padding": null,
1234
            "right": null,
1235
            "top": null,
1236
            "visibility": null,
1237
            "width": null
1238
          }
1239
        },
1240
        "2d6aa1ecdf7444b4b4cb81515d3654be": {
1241
          "model_module": "@jupyter-widgets/controls",
1242
          "model_name": "ProgressStyleModel",
1243
          "model_module_version": "1.5.0",
1244
          "state": {
1245
            "_model_module": "@jupyter-widgets/controls",
1246
            "_model_module_version": "1.5.0",
1247
            "_model_name": "ProgressStyleModel",
1248
            "_view_count": null,
1249
            "_view_module": "@jupyter-widgets/base",
1250
            "_view_module_version": "1.2.0",
1251
            "_view_name": "StyleView",
1252
            "bar_color": null,
1253
            "description_width": ""
1254
          }
1255
        },
1256
        "6cedbad90ca9423f85a48d7e4073a378": {
1257
          "model_module": "@jupyter-widgets/base",
1258
          "model_name": "LayoutModel",
1259
          "model_module_version": "1.2.0",
1260
          "state": {
1261
            "_model_module": "@jupyter-widgets/base",
1262
            "_model_module_version": "1.2.0",
1263
            "_model_name": "LayoutModel",
1264
            "_view_count": null,
1265
            "_view_module": "@jupyter-widgets/base",
1266
            "_view_module_version": "1.2.0",
1267
            "_view_name": "LayoutView",
1268
            "align_content": null,
1269
            "align_items": null,
1270
            "align_self": null,
1271
            "border": null,
1272
            "bottom": null,
1273
            "display": null,
1274
            "flex": null,
1275
            "flex_flow": null,
1276
            "grid_area": null,
1277
            "grid_auto_columns": null,
1278
            "grid_auto_flow": null,
1279
            "grid_auto_rows": null,
1280
            "grid_column": null,
1281
            "grid_gap": null,
1282
            "grid_row": null,
1283
            "grid_template_areas": null,
1284
            "grid_template_columns": null,
1285
            "grid_template_rows": null,
1286
            "height": null,
1287
            "justify_content": null,
1288
            "justify_items": null,
1289
            "left": null,
1290
            "margin": null,
1291
            "max_height": null,
1292
            "max_width": null,
1293
            "min_height": null,
1294
            "min_width": null,
1295
            "object_fit": null,
1296
            "object_position": null,
1297
            "order": null,
1298
            "overflow": null,
1299
            "overflow_x": null,
1300
            "overflow_y": null,
1301
            "padding": null,
1302
            "right": null,
1303
            "top": null,
1304
            "visibility": null,
1305
            "width": null
1306
          }
1307
        },
1308
        "c893eb5da4e34e4999981b3810a4205b": {
1309
          "model_module": "@jupyter-widgets/controls",
1310
          "model_name": "DescriptionStyleModel",
1311
          "model_module_version": "1.5.0",
1312
          "state": {
1313
            "_model_module": "@jupyter-widgets/controls",
1314
            "_model_module_version": "1.5.0",
1315
            "_model_name": "DescriptionStyleModel",
1316
            "_view_count": null,
1317
            "_view_module": "@jupyter-widgets/base",
1318
            "_view_module_version": "1.2.0",
1319
            "_view_name": "StyleView",
1320
            "description_width": ""
1321
          }
1322
        },
1323
        "2a5efce36f38406189e82e2e27b06bab": {
1324
          "model_module": "@jupyter-widgets/controls",
1325
          "model_name": "HBoxModel",
1326
          "model_module_version": "1.5.0",
1327
          "state": {
1328
            "_dom_classes": [],
1329
            "_model_module": "@jupyter-widgets/controls",
1330
            "_model_module_version": "1.5.0",
1331
            "_model_name": "HBoxModel",
1332
            "_view_count": null,
1333
            "_view_module": "@jupyter-widgets/controls",
1334
            "_view_module_version": "1.5.0",
1335
            "_view_name": "HBoxView",
1336
            "box_style": "",
1337
            "children": [
1338
              "IPY_MODEL_3c828089249743e6aa4f3ee60f77caee",
1339
              "IPY_MODEL_543b02a2098043ca849ecdda4f4c7a81",
1340
              "IPY_MODEL_9b076b5c6cf74e56abb01cbcb59d1deb"
1341
            ],
1342
            "layout": "IPY_MODEL_ac08f05888c64726aabcb9a1cfd65aba"
1343
          }
1344
        },
1345
        "3c828089249743e6aa4f3ee60f77caee": {
1346
          "model_module": "@jupyter-widgets/controls",
1347
          "model_name": "HTMLModel",
1348
          "model_module_version": "1.5.0",
1349
          "state": {
1350
            "_dom_classes": [],
1351
            "_model_module": "@jupyter-widgets/controls",
1352
            "_model_module_version": "1.5.0",
1353
            "_model_name": "HTMLModel",
1354
            "_view_count": null,
1355
            "_view_module": "@jupyter-widgets/controls",
1356
            "_view_module_version": "1.5.0",
1357
            "_view_name": "HTMLView",
1358
            "description": "",
1359
            "description_tooltip": null,
1360
            "layout": "IPY_MODEL_4f48b906c779402187567aad8b4ba488",
1361
            "placeholder": "​",
1362
            "style": "IPY_MODEL_e004498b56524804b28661cde5fdce81",
1363
            "value": "output.safetensors: 100%"
1364
          }
1365
        },
1366
        "543b02a2098043ca849ecdda4f4c7a81": {
1367
          "model_module": "@jupyter-widgets/controls",
1368
          "model_name": "FloatProgressModel",
1369
          "model_module_version": "1.5.0",
1370
          "state": {
1371
            "_dom_classes": [],
1372
            "_model_module": "@jupyter-widgets/controls",
1373
            "_model_module_version": "1.5.0",
1374
            "_model_name": "FloatProgressModel",
1375
            "_view_count": null,
1376
            "_view_module": "@jupyter-widgets/controls",
1377
            "_view_module_version": "1.5.0",
1378
            "_view_name": "ProgressView",
1379
            "bar_style": "success",
1380
            "description": "",
1381
            "description_tooltip": null,
1382
            "layout": "IPY_MODEL_9931d545676d49039aba007f13904155",
1383
            "max": 4735018016,
1384
            "min": 0,
1385
            "orientation": "horizontal",
1386
            "style": "IPY_MODEL_130049623d6744dcac8a7ffa25e1e1d1",
1387
            "value": 4735018016
1388
          }
1389
        },
1390
        "9b076b5c6cf74e56abb01cbcb59d1deb": {
1391
          "model_module": "@jupyter-widgets/controls",
1392
          "model_name": "HTMLModel",
1393
          "model_module_version": "1.5.0",
1394
          "state": {
1395
            "_dom_classes": [],
1396
            "_model_module": "@jupyter-widgets/controls",
1397
            "_model_module_version": "1.5.0",
1398
            "_model_name": "HTMLModel",
1399
            "_view_count": null,
1400
            "_view_module": "@jupyter-widgets/controls",
1401
            "_view_module_version": "1.5.0",
1402
            "_view_name": "HTMLView",
1403
            "description": "",
1404
            "description_tooltip": null,
1405
            "layout": "IPY_MODEL_f48ddd7d4d304e10b3fabc3cdc541dbf",
1406
            "placeholder": "​",
1407
            "style": "IPY_MODEL_bcdd93e578fd49e8b1bb76f43bde3483",
1408
            "value": " 4.74G/4.74G [02:21&lt;00:00, 32.3MB/s]"
1409
          }
1410
        },
1411
        "ac08f05888c64726aabcb9a1cfd65aba": {
1412
          "model_module": "@jupyter-widgets/base",
1413
          "model_name": "LayoutModel",
1414
          "model_module_version": "1.2.0",
1415
          "state": {
1416
            "_model_module": "@jupyter-widgets/base",
1417
            "_model_module_version": "1.2.0",
1418
            "_model_name": "LayoutModel",
1419
            "_view_count": null,
1420
            "_view_module": "@jupyter-widgets/base",
1421
            "_view_module_version": "1.2.0",
1422
            "_view_name": "LayoutView",
1423
            "align_content": null,
1424
            "align_items": null,
1425
            "align_self": null,
1426
            "border": null,
1427
            "bottom": null,
1428
            "display": null,
1429
            "flex": null,
1430
            "flex_flow": null,
1431
            "grid_area": null,
1432
            "grid_auto_columns": null,
1433
            "grid_auto_flow": null,
1434
            "grid_auto_rows": null,
1435
            "grid_column": null,
1436
            "grid_gap": null,
1437
            "grid_row": null,
1438
            "grid_template_areas": null,
1439
            "grid_template_columns": null,
1440
            "grid_template_rows": null,
1441
            "height": null,
1442
            "justify_content": null,
1443
            "justify_items": null,
1444
            "left": null,
1445
            "margin": null,
1446
            "max_height": null,
1447
            "max_width": null,
1448
            "min_height": null,
1449
            "min_width": null,
1450
            "object_fit": null,
1451
            "object_position": null,
1452
            "order": null,
1453
            "overflow": null,
1454
            "overflow_x": null,
1455
            "overflow_y": null,
1456
            "padding": null,
1457
            "right": null,
1458
            "top": null,
1459
            "visibility": null,
1460
            "width": null
1461
          }
1462
        },
1463
        "4f48b906c779402187567aad8b4ba488": {
1464
          "model_module": "@jupyter-widgets/base",
1465
          "model_name": "LayoutModel",
1466
          "model_module_version": "1.2.0",
1467
          "state": {
1468
            "_model_module": "@jupyter-widgets/base",
1469
            "_model_module_version": "1.2.0",
1470
            "_model_name": "LayoutModel",
1471
            "_view_count": null,
1472
            "_view_module": "@jupyter-widgets/base",
1473
            "_view_module_version": "1.2.0",
1474
            "_view_name": "LayoutView",
1475
            "align_content": null,
1476
            "align_items": null,
1477
            "align_self": null,
1478
            "border": null,
1479
            "bottom": null,
1480
            "display": null,
1481
            "flex": null,
1482
            "flex_flow": null,
1483
            "grid_area": null,
1484
            "grid_auto_columns": null,
1485
            "grid_auto_flow": null,
1486
            "grid_auto_rows": null,
1487
            "grid_column": null,
1488
            "grid_gap": null,
1489
            "grid_row": null,
1490
            "grid_template_areas": null,
1491
            "grid_template_columns": null,
1492
            "grid_template_rows": null,
1493
            "height": null,
1494
            "justify_content": null,
1495
            "justify_items": null,
1496
            "left": null,
1497
            "margin": null,
1498
            "max_height": null,
1499
            "max_width": null,
1500
            "min_height": null,
1501
            "min_width": null,
1502
            "object_fit": null,
1503
            "object_position": null,
1504
            "order": null,
1505
            "overflow": null,
1506
            "overflow_x": null,
1507
            "overflow_y": null,
1508
            "padding": null,
1509
            "right": null,
1510
            "top": null,
1511
            "visibility": null,
1512
            "width": null
1513
          }
1514
        },
1515
        "e004498b56524804b28661cde5fdce81": {
1516
          "model_module": "@jupyter-widgets/controls",
1517
          "model_name": "DescriptionStyleModel",
1518
          "model_module_version": "1.5.0",
1519
          "state": {
1520
            "_model_module": "@jupyter-widgets/controls",
1521
            "_model_module_version": "1.5.0",
1522
            "_model_name": "DescriptionStyleModel",
1523
            "_view_count": null,
1524
            "_view_module": "@jupyter-widgets/base",
1525
            "_view_module_version": "1.2.0",
1526
            "_view_name": "StyleView",
1527
            "description_width": ""
1528
          }
1529
        },
1530
        "9931d545676d49039aba007f13904155": {
1531
          "model_module": "@jupyter-widgets/base",
1532
          "model_name": "LayoutModel",
1533
          "model_module_version": "1.2.0",
1534
          "state": {
1535
            "_model_module": "@jupyter-widgets/base",
1536
            "_model_module_version": "1.2.0",
1537
            "_model_name": "LayoutModel",
1538
            "_view_count": null,
1539
            "_view_module": "@jupyter-widgets/base",
1540
            "_view_module_version": "1.2.0",
1541
            "_view_name": "LayoutView",
1542
            "align_content": null,
1543
            "align_items": null,
1544
            "align_self": null,
1545
            "border": null,
1546
            "bottom": null,
1547
            "display": null,
1548
            "flex": null,
1549
            "flex_flow": null,
1550
            "grid_area": null,
1551
            "grid_auto_columns": null,
1552
            "grid_auto_flow": null,
1553
            "grid_auto_rows": null,
1554
            "grid_column": null,
1555
            "grid_gap": null,
1556
            "grid_row": null,
1557
            "grid_template_areas": null,
1558
            "grid_template_columns": null,
1559
            "grid_template_rows": null,
1560
            "height": null,
1561
            "justify_content": null,
1562
            "justify_items": null,
1563
            "left": null,
1564
            "margin": null,
1565
            "max_height": null,
1566
            "max_width": null,
1567
            "min_height": null,
1568
            "min_width": null,
1569
            "object_fit": null,
1570
            "object_position": null,
1571
            "order": null,
1572
            "overflow": null,
1573
            "overflow_x": null,
1574
            "overflow_y": null,
1575
            "padding": null,
1576
            "right": null,
1577
            "top": null,
1578
            "visibility": null,
1579
            "width": null
1580
          }
1581
        },
1582
        "130049623d6744dcac8a7ffa25e1e1d1": {
1583
          "model_module": "@jupyter-widgets/controls",
1584
          "model_name": "ProgressStyleModel",
1585
          "model_module_version": "1.5.0",
1586
          "state": {
1587
            "_model_module": "@jupyter-widgets/controls",
1588
            "_model_module_version": "1.5.0",
1589
            "_model_name": "ProgressStyleModel",
1590
            "_view_count": null,
1591
            "_view_module": "@jupyter-widgets/base",
1592
            "_view_module_version": "1.2.0",
1593
            "_view_name": "StyleView",
1594
            "bar_color": null,
1595
            "description_width": ""
1596
          }
1597
        },
1598
        "f48ddd7d4d304e10b3fabc3cdc541dbf": {
1599
          "model_module": "@jupyter-widgets/base",
1600
          "model_name": "LayoutModel",
1601
          "model_module_version": "1.2.0",
1602
          "state": {
1603
            "_model_module": "@jupyter-widgets/base",
1604
            "_model_module_version": "1.2.0",
1605
            "_model_name": "LayoutModel",
1606
            "_view_count": null,
1607
            "_view_module": "@jupyter-widgets/base",
1608
            "_view_module_version": "1.2.0",
1609
            "_view_name": "LayoutView",
1610
            "align_content": null,
1611
            "align_items": null,
1612
            "align_self": null,
1613
            "border": null,
1614
            "bottom": null,
1615
            "display": null,
1616
            "flex": null,
1617
            "flex_flow": null,
1618
            "grid_area": null,
1619
            "grid_auto_columns": null,
1620
            "grid_auto_flow": null,
1621
            "grid_auto_rows": null,
1622
            "grid_column": null,
1623
            "grid_gap": null,
1624
            "grid_row": null,
1625
            "grid_template_areas": null,
1626
            "grid_template_columns": null,
1627
            "grid_template_rows": null,
1628
            "height": null,
1629
            "justify_content": null,
1630
            "justify_items": null,
1631
            "left": null,
1632
            "margin": null,
1633
            "max_height": null,
1634
            "max_width": null,
1635
            "min_height": null,
1636
            "min_width": null,
1637
            "object_fit": null,
1638
            "object_position": null,
1639
            "order": null,
1640
            "overflow": null,
1641
            "overflow_x": null,
1642
            "overflow_y": null,
1643
            "padding": null,
1644
            "right": null,
1645
            "top": null,
1646
            "visibility": null,
1647
            "width": null
1648
          }
1649
        },
1650
        "bcdd93e578fd49e8b1bb76f43bde3483": {
1651
          "model_module": "@jupyter-widgets/controls",
1652
          "model_name": "DescriptionStyleModel",
1653
          "model_module_version": "1.5.0",
1654
          "state": {
1655
            "_model_module": "@jupyter-widgets/controls",
1656
            "_model_module_version": "1.5.0",
1657
            "_model_name": "DescriptionStyleModel",
1658
            "_view_count": null,
1659
            "_view_module": "@jupyter-widgets/base",
1660
            "_view_module_version": "1.2.0",
1661
            "_view_name": "StyleView",
1662
            "description_width": ""
1663
          }
1664
        },
1665
        "a051f03b2e8340dea8b8d8f0389f1d76": {
1666
          "model_module": "@jupyter-widgets/controls",
1667
          "model_name": "HBoxModel",
1668
          "model_module_version": "1.5.0",
1669
          "state": {
1670
            "_dom_classes": [],
1671
            "_model_module": "@jupyter-widgets/controls",
1672
            "_model_module_version": "1.5.0",
1673
            "_model_name": "HBoxModel",
1674
            "_view_count": null,
1675
            "_view_module": "@jupyter-widgets/controls",
1676
            "_view_module_version": "1.5.0",
1677
            "_view_name": "HBoxView",
1678
            "box_style": "",
1679
            "children": [
1680
              "IPY_MODEL_17c15d87496d4e5ea25814806b8606ea",
1681
              "IPY_MODEL_71093ecee7ac45798d8bcb924af2906c",
1682
              "IPY_MODEL_5a0d9471e6cd4f2988f042c4a4e48a3d"
1683
            ],
1684
            "layout": "IPY_MODEL_841d7197d6324552a0fbb6d6f5ac7601"
1685
          }
1686
        },
1687
        "17c15d87496d4e5ea25814806b8606ea": {
1688
          "model_module": "@jupyter-widgets/controls",
1689
          "model_name": "HTMLModel",
1690
          "model_module_version": "1.5.0",
1691
          "state": {
1692
            "_dom_classes": [],
1693
            "_model_module": "@jupyter-widgets/controls",
1694
            "_model_module_version": "1.5.0",
1695
            "_model_name": "HTMLModel",
1696
            "_view_count": null,
1697
            "_view_module": "@jupyter-widgets/controls",
1698
            "_view_module_version": "1.5.0",
1699
            "_view_name": "HTMLView",
1700
            "description": "",
1701
            "description_tooltip": null,
1702
            "layout": "IPY_MODEL_3c3d9d10ee9e466ba170b3dd3aa3ecdd",
1703
            "placeholder": "​",
1704
            "style": "IPY_MODEL_fa9d061965d74d0eb6d728c1f4058845",
1705
            "value": "Upload 5 LFS files: 100%"
1706
          }
1707
        },
1708
        "71093ecee7ac45798d8bcb924af2906c": {
1709
          "model_module": "@jupyter-widgets/controls",
1710
          "model_name": "FloatProgressModel",
1711
          "model_module_version": "1.5.0",
1712
          "state": {
1713
            "_dom_classes": [],
1714
            "_model_module": "@jupyter-widgets/controls",
1715
            "_model_module_version": "1.5.0",
1716
            "_model_name": "FloatProgressModel",
1717
            "_view_count": null,
1718
            "_view_module": "@jupyter-widgets/controls",
1719
            "_view_module_version": "1.5.0",
1720
            "_view_name": "ProgressView",
1721
            "bar_style": "success",
1722
            "description": "",
1723
            "description_tooltip": null,
1724
            "layout": "IPY_MODEL_62de7ed888614d26875a0ecd99cb996f",
1725
            "max": 5,
1726
            "min": 0,
1727
            "orientation": "horizontal",
1728
            "style": "IPY_MODEL_89dc60db3b9a4a1587b00130ffde2311",
1729
            "value": 5
1730
          }
1731
        },
1732
        "5a0d9471e6cd4f2988f042c4a4e48a3d": {
1733
          "model_module": "@jupyter-widgets/controls",
1734
          "model_name": "HTMLModel",
1735
          "model_module_version": "1.5.0",
1736
          "state": {
1737
            "_dom_classes": [],
1738
            "_model_module": "@jupyter-widgets/controls",
1739
            "_model_module_version": "1.5.0",
1740
            "_model_name": "HTMLModel",
1741
            "_view_count": null,
1742
            "_view_module": "@jupyter-widgets/controls",
1743
            "_view_module_version": "1.5.0",
1744
            "_view_name": "HTMLView",
1745
            "description": "",
1746
            "description_tooltip": null,
1747
            "layout": "IPY_MODEL_9d0851b2c54c4e5cb635cd2652890824",
1748
            "placeholder": "​",
1749
            "style": "IPY_MODEL_7a89919a4de9454aa8a7c134f1b1fa3d",
1750
            "value": " 5/5 [02:22&lt;00:00, 57.57s/it]"
1751
          }
1752
        },
1753
        "841d7197d6324552a0fbb6d6f5ac7601": {
1754
          "model_module": "@jupyter-widgets/base",
1755
          "model_name": "LayoutModel",
1756
          "model_module_version": "1.2.0",
1757
          "state": {
1758
            "_model_module": "@jupyter-widgets/base",
1759
            "_model_module_version": "1.2.0",
1760
            "_model_name": "LayoutModel",
1761
            "_view_count": null,
1762
            "_view_module": "@jupyter-widgets/base",
1763
            "_view_module_version": "1.2.0",
1764
            "_view_name": "LayoutView",
1765
            "align_content": null,
1766
            "align_items": null,
1767
            "align_self": null,
1768
            "border": null,
1769
            "bottom": null,
1770
            "display": null,
1771
            "flex": null,
1772
            "flex_flow": null,
1773
            "grid_area": null,
1774
            "grid_auto_columns": null,
1775
            "grid_auto_flow": null,
1776
            "grid_auto_rows": null,
1777
            "grid_column": null,
1778
            "grid_gap": null,
1779
            "grid_row": null,
1780
            "grid_template_areas": null,
1781
            "grid_template_columns": null,
1782
            "grid_template_rows": null,
1783
            "height": null,
1784
            "justify_content": null,
1785
            "justify_items": null,
1786
            "left": null,
1787
            "margin": null,
1788
            "max_height": null,
1789
            "max_width": null,
1790
            "min_height": null,
1791
            "min_width": null,
1792
            "object_fit": null,
1793
            "object_position": null,
1794
            "order": null,
1795
            "overflow": null,
1796
            "overflow_x": null,
1797
            "overflow_y": null,
1798
            "padding": null,
1799
            "right": null,
1800
            "top": null,
1801
            "visibility": null,
1802
            "width": null
1803
          }
1804
        },
1805
        "3c3d9d10ee9e466ba170b3dd3aa3ecdd": {
1806
          "model_module": "@jupyter-widgets/base",
1807
          "model_name": "LayoutModel",
1808
          "model_module_version": "1.2.0",
1809
          "state": {
1810
            "_model_module": "@jupyter-widgets/base",
1811
            "_model_module_version": "1.2.0",
1812
            "_model_name": "LayoutModel",
1813
            "_view_count": null,
1814
            "_view_module": "@jupyter-widgets/base",
1815
            "_view_module_version": "1.2.0",
1816
            "_view_name": "LayoutView",
1817
            "align_content": null,
1818
            "align_items": null,
1819
            "align_self": null,
1820
            "border": null,
1821
            "bottom": null,
1822
            "display": null,
1823
            "flex": null,
1824
            "flex_flow": null,
1825
            "grid_area": null,
1826
            "grid_auto_columns": null,
1827
            "grid_auto_flow": null,
1828
            "grid_auto_rows": null,
1829
            "grid_column": null,
1830
            "grid_gap": null,
1831
            "grid_row": null,
1832
            "grid_template_areas": null,
1833
            "grid_template_columns": null,
1834
            "grid_template_rows": null,
1835
            "height": null,
1836
            "justify_content": null,
1837
            "justify_items": null,
1838
            "left": null,
1839
            "margin": null,
1840
            "max_height": null,
1841
            "max_width": null,
1842
            "min_height": null,
1843
            "min_width": null,
1844
            "object_fit": null,
1845
            "object_position": null,
1846
            "order": null,
1847
            "overflow": null,
1848
            "overflow_x": null,
1849
            "overflow_y": null,
1850
            "padding": null,
1851
            "right": null,
1852
            "top": null,
1853
            "visibility": null,
1854
            "width": null
1855
          }
1856
        },
1857
        "fa9d061965d74d0eb6d728c1f4058845": {
1858
          "model_module": "@jupyter-widgets/controls",
1859
          "model_name": "DescriptionStyleModel",
1860
          "model_module_version": "1.5.0",
1861
          "state": {
1862
            "_model_module": "@jupyter-widgets/controls",
1863
            "_model_module_version": "1.5.0",
1864
            "_model_name": "DescriptionStyleModel",
1865
            "_view_count": null,
1866
            "_view_module": "@jupyter-widgets/base",
1867
            "_view_module_version": "1.2.0",
1868
            "_view_name": "StyleView",
1869
            "description_width": ""
1870
          }
1871
        },
1872
        "62de7ed888614d26875a0ecd99cb996f": {
1873
          "model_module": "@jupyter-widgets/base",
1874
          "model_name": "LayoutModel",
1875
          "model_module_version": "1.2.0",
1876
          "state": {
1877
            "_model_module": "@jupyter-widgets/base",
1878
            "_model_module_version": "1.2.0",
1879
            "_model_name": "LayoutModel",
1880
            "_view_count": null,
1881
            "_view_module": "@jupyter-widgets/base",
1882
            "_view_module_version": "1.2.0",
1883
            "_view_name": "LayoutView",
1884
            "align_content": null,
1885
            "align_items": null,
1886
            "align_self": null,
1887
            "border": null,
1888
            "bottom": null,
1889
            "display": null,
1890
            "flex": null,
1891
            "flex_flow": null,
1892
            "grid_area": null,
1893
            "grid_auto_columns": null,
1894
            "grid_auto_flow": null,
1895
            "grid_auto_rows": null,
1896
            "grid_column": null,
1897
            "grid_gap": null,
1898
            "grid_row": null,
1899
            "grid_template_areas": null,
1900
            "grid_template_columns": null,
1901
            "grid_template_rows": null,
1902
            "height": null,
1903
            "justify_content": null,
1904
            "justify_items": null,
1905
            "left": null,
1906
            "margin": null,
1907
            "max_height": null,
1908
            "max_width": null,
1909
            "min_height": null,
1910
            "min_width": null,
1911
            "object_fit": null,
1912
            "object_position": null,
1913
            "order": null,
1914
            "overflow": null,
1915
            "overflow_x": null,
1916
            "overflow_y": null,
1917
            "padding": null,
1918
            "right": null,
1919
            "top": null,
1920
            "visibility": null,
1921
            "width": null
1922
          }
1923
        },
1924
        "89dc60db3b9a4a1587b00130ffde2311": {
1925
          "model_module": "@jupyter-widgets/controls",
1926
          "model_name": "ProgressStyleModel",
1927
          "model_module_version": "1.5.0",
1928
          "state": {
1929
            "_model_module": "@jupyter-widgets/controls",
1930
            "_model_module_version": "1.5.0",
1931
            "_model_name": "ProgressStyleModel",
1932
            "_view_count": null,
1933
            "_view_module": "@jupyter-widgets/base",
1934
            "_view_module_version": "1.2.0",
1935
            "_view_name": "StyleView",
1936
            "bar_color": null,
1937
            "description_width": ""
1938
          }
1939
        },
1940
        "9d0851b2c54c4e5cb635cd2652890824": {
1941
          "model_module": "@jupyter-widgets/base",
1942
          "model_name": "LayoutModel",
1943
          "model_module_version": "1.2.0",
1944
          "state": {
1945
            "_model_module": "@jupyter-widgets/base",
1946
            "_model_module_version": "1.2.0",
1947
            "_model_name": "LayoutModel",
1948
            "_view_count": null,
1949
            "_view_module": "@jupyter-widgets/base",
1950
            "_view_module_version": "1.2.0",
1951
            "_view_name": "LayoutView",
1952
            "align_content": null,
1953
            "align_items": null,
1954
            "align_self": null,
1955
            "border": null,
1956
            "bottom": null,
1957
            "display": null,
1958
            "flex": null,
1959
            "flex_flow": null,
1960
            "grid_area": null,
1961
            "grid_auto_columns": null,
1962
            "grid_auto_flow": null,
1963
            "grid_auto_rows": null,
1964
            "grid_column": null,
1965
            "grid_gap": null,
1966
            "grid_row": null,
1967
            "grid_template_areas": null,
1968
            "grid_template_columns": null,
1969
            "grid_template_rows": null,
1970
            "height": null,
1971
            "justify_content": null,
1972
            "justify_items": null,
1973
            "left": null,
1974
            "margin": null,
1975
            "max_height": null,
1976
            "max_width": null,
1977
            "min_height": null,
1978
            "min_width": null,
1979
            "object_fit": null,
1980
            "object_position": null,
1981
            "order": null,
1982
            "overflow": null,
1983
            "overflow_x": null,
1984
            "overflow_y": null,
1985
            "padding": null,
1986
            "right": null,
1987
            "top": null,
1988
            "visibility": null,
1989
            "width": null
1990
          }
1991
        },
1992
        "7a89919a4de9454aa8a7c134f1b1fa3d": {
1993
          "model_module": "@jupyter-widgets/controls",
1994
          "model_name": "DescriptionStyleModel",
1995
          "model_module_version": "1.5.0",
1996
          "state": {
1997
            "_model_module": "@jupyter-widgets/controls",
1998
            "_model_module_version": "1.5.0",
1999
            "_model_name": "DescriptionStyleModel",
2000
            "_view_count": null,
2001
            "_view_module": "@jupyter-widgets/base",
2002
            "_view_module_version": "1.2.0",
2003
            "_view_name": "StyleView",
2004
            "description_width": ""
2005
          }
2006
        },
2007
        "30fb290999b84d9eb69b8dd720c534b5": {
2008
          "model_module": "@jupyter-widgets/controls",
2009
          "model_name": "HBoxModel",
2010
          "model_module_version": "1.5.0",
2011
          "state": {
2012
            "_dom_classes": [],
2013
            "_model_module": "@jupyter-widgets/controls",
2014
            "_model_module_version": "1.5.0",
2015
            "_model_name": "HBoxModel",
2016
            "_view_count": null,
2017
            "_view_module": "@jupyter-widgets/controls",
2018
            "_view_module_version": "1.5.0",
2019
            "_view_name": "HBoxView",
2020
            "box_style": "",
2021
            "children": [
2022
              "IPY_MODEL_37a67b2e108248858858b72cf2d00aba",
2023
              "IPY_MODEL_a038d308888c40bca1cc45c962344ec6",
2024
              "IPY_MODEL_70bd55b8cd2f42d6b9ecd76c17972771"
2025
            ],
2026
            "layout": "IPY_MODEL_e18504b6c48a45ef8abe75f2d59147ea"
2027
          }
2028
        },
2029
        "37a67b2e108248858858b72cf2d00aba": {
2030
          "model_module": "@jupyter-widgets/controls",
2031
          "model_name": "HTMLModel",
2032
          "model_module_version": "1.5.0",
2033
          "state": {
2034
            "_dom_classes": [],
2035
            "_model_module": "@jupyter-widgets/controls",
2036
            "_model_module_version": "1.5.0",
2037
            "_model_name": "HTMLModel",
2038
            "_view_count": null,
2039
            "_view_module": "@jupyter-widgets/controls",
2040
            "_view_module_version": "1.5.0",
2041
            "_view_name": "HTMLView",
2042
            "description": "",
2043
            "description_tooltip": null,
2044
            "layout": "IPY_MODEL_b8e8032b75cf4b1eadfe76395f8811ac",
2045
            "placeholder": "​",
2046
            "style": "IPY_MODEL_dd6c2ab6494c48878a7521c0fc0e2109",
2047
            "value": "input_states.safetensors: 100%"
2048
          }
2049
        },
2050
        "a038d308888c40bca1cc45c962344ec6": {
2051
          "model_module": "@jupyter-widgets/controls",
2052
          "model_name": "FloatProgressModel",
2053
          "model_module_version": "1.5.0",
2054
          "state": {
2055
            "_dom_classes": [],
2056
            "_model_module": "@jupyter-widgets/controls",
2057
            "_model_module_version": "1.5.0",
2058
            "_model_name": "FloatProgressModel",
2059
            "_view_count": null,
2060
            "_view_module": "@jupyter-widgets/controls",
2061
            "_view_module_version": "1.5.0",
2062
            "_view_name": "ProgressView",
2063
            "bar_style": "success",
2064
            "description": "",
2065
            "description_tooltip": null,
2066
            "layout": "IPY_MODEL_6e98141655cc48d48f47f3981fb385e6",
2067
            "max": 1677721696,
2068
            "min": 0,
2069
            "orientation": "horizontal",
2070
            "style": "IPY_MODEL_fbf6c4c6ed85465095eb3ae986994c69",
2071
            "value": 1677721696
2072
          }
2073
        },
2074
        "70bd55b8cd2f42d6b9ecd76c17972771": {
2075
          "model_module": "@jupyter-widgets/controls",
2076
          "model_name": "HTMLModel",
2077
          "model_module_version": "1.5.0",
2078
          "state": {
2079
            "_dom_classes": [],
2080
            "_model_module": "@jupyter-widgets/controls",
2081
            "_model_module_version": "1.5.0",
2082
            "_model_name": "HTMLModel",
2083
            "_view_count": null,
2084
            "_view_module": "@jupyter-widgets/controls",
2085
            "_view_module_version": "1.5.0",
2086
            "_view_name": "HTMLView",
2087
            "description": "",
2088
            "description_tooltip": null,
2089
            "layout": "IPY_MODEL_95addcc750ad45ecbc37c5c7f463d812",
2090
            "placeholder": "​",
2091
            "style": "IPY_MODEL_0e8403a6428b4387a1ebbdecf7c7aa03",
2092
            "value": " 1.68G/1.68G [00:52&lt;00:00, 40.4MB/s]"
2093
          }
2094
        },
2095
        "e18504b6c48a45ef8abe75f2d59147ea": {
2096
          "model_module": "@jupyter-widgets/base",
2097
          "model_name": "LayoutModel",
2098
          "model_module_version": "1.2.0",
2099
          "state": {
2100
            "_model_module": "@jupyter-widgets/base",
2101
            "_model_module_version": "1.2.0",
2102
            "_model_name": "LayoutModel",
2103
            "_view_count": null,
2104
            "_view_module": "@jupyter-widgets/base",
2105
            "_view_module_version": "1.2.0",
2106
            "_view_name": "LayoutView",
2107
            "align_content": null,
2108
            "align_items": null,
2109
            "align_self": null,
2110
            "border": null,
2111
            "bottom": null,
2112
            "display": null,
2113
            "flex": null,
2114
            "flex_flow": null,
2115
            "grid_area": null,
2116
            "grid_auto_columns": null,
2117
            "grid_auto_flow": null,
2118
            "grid_auto_rows": null,
2119
            "grid_column": null,
2120
            "grid_gap": null,
2121
            "grid_row": null,
2122
            "grid_template_areas": null,
2123
            "grid_template_columns": null,
2124
            "grid_template_rows": null,
2125
            "height": null,
2126
            "justify_content": null,
2127
            "justify_items": null,
2128
            "left": null,
2129
            "margin": null,
2130
            "max_height": null,
2131
            "max_width": null,
2132
            "min_height": null,
2133
            "min_width": null,
2134
            "object_fit": null,
2135
            "object_position": null,
2136
            "order": null,
2137
            "overflow": null,
2138
            "overflow_x": null,
2139
            "overflow_y": null,
2140
            "padding": null,
2141
            "right": null,
2142
            "top": null,
2143
            "visibility": null,
2144
            "width": null
2145
          }
2146
        },
2147
        "b8e8032b75cf4b1eadfe76395f8811ac": {
2148
          "model_module": "@jupyter-widgets/base",
2149
          "model_name": "LayoutModel",
2150
          "model_module_version": "1.2.0",
2151
          "state": {
2152
            "_model_module": "@jupyter-widgets/base",
2153
            "_model_module_version": "1.2.0",
2154
            "_model_name": "LayoutModel",
2155
            "_view_count": null,
2156
            "_view_module": "@jupyter-widgets/base",
2157
            "_view_module_version": "1.2.0",
2158
            "_view_name": "LayoutView",
2159
            "align_content": null,
2160
            "align_items": null,
2161
            "align_self": null,
2162
            "border": null,
2163
            "bottom": null,
2164
            "display": null,
2165
            "flex": null,
2166
            "flex_flow": null,
2167
            "grid_area": null,
2168
            "grid_auto_columns": null,
2169
            "grid_auto_flow": null,
2170
            "grid_auto_rows": null,
2171
            "grid_column": null,
2172
            "grid_gap": null,
2173
            "grid_row": null,
2174
            "grid_template_areas": null,
2175
            "grid_template_columns": null,
2176
            "grid_template_rows": null,
2177
            "height": null,
2178
            "justify_content": null,
2179
            "justify_items": null,
2180
            "left": null,
2181
            "margin": null,
2182
            "max_height": null,
2183
            "max_width": null,
2184
            "min_height": null,
2185
            "min_width": null,
2186
            "object_fit": null,
2187
            "object_position": null,
2188
            "order": null,
2189
            "overflow": null,
2190
            "overflow_x": null,
2191
            "overflow_y": null,
2192
            "padding": null,
2193
            "right": null,
2194
            "top": null,
2195
            "visibility": null,
2196
            "width": null
2197
          }
2198
        },
2199
        "dd6c2ab6494c48878a7521c0fc0e2109": {
2200
          "model_module": "@jupyter-widgets/controls",
2201
          "model_name": "DescriptionStyleModel",
2202
          "model_module_version": "1.5.0",
2203
          "state": {
2204
            "_model_module": "@jupyter-widgets/controls",
2205
            "_model_module_version": "1.5.0",
2206
            "_model_name": "DescriptionStyleModel",
2207
            "_view_count": null,
2208
            "_view_module": "@jupyter-widgets/base",
2209
            "_view_module_version": "1.2.0",
2210
            "_view_name": "StyleView",
2211
            "description_width": ""
2212
          }
2213
        },
2214
        "6e98141655cc48d48f47f3981fb385e6": {
2215
          "model_module": "@jupyter-widgets/base",
2216
          "model_name": "LayoutModel",
2217
          "model_module_version": "1.2.0",
2218
          "state": {
2219
            "_model_module": "@jupyter-widgets/base",
2220
            "_model_module_version": "1.2.0",
2221
            "_model_name": "LayoutModel",
2222
            "_view_count": null,
2223
            "_view_module": "@jupyter-widgets/base",
2224
            "_view_module_version": "1.2.0",
2225
            "_view_name": "LayoutView",
2226
            "align_content": null,
2227
            "align_items": null,
2228
            "align_self": null,
2229
            "border": null,
2230
            "bottom": null,
2231
            "display": null,
2232
            "flex": null,
2233
            "flex_flow": null,
2234
            "grid_area": null,
2235
            "grid_auto_columns": null,
2236
            "grid_auto_flow": null,
2237
            "grid_auto_rows": null,
2238
            "grid_column": null,
2239
            "grid_gap": null,
2240
            "grid_row": null,
2241
            "grid_template_areas": null,
2242
            "grid_template_columns": null,
2243
            "grid_template_rows": null,
2244
            "height": null,
2245
            "justify_content": null,
2246
            "justify_items": null,
2247
            "left": null,
2248
            "margin": null,
2249
            "max_height": null,
2250
            "max_width": null,
2251
            "min_height": null,
2252
            "min_width": null,
2253
            "object_fit": null,
2254
            "object_position": null,
2255
            "order": null,
2256
            "overflow": null,
2257
            "overflow_x": null,
2258
            "overflow_y": null,
2259
            "padding": null,
2260
            "right": null,
2261
            "top": null,
2262
            "visibility": null,
2263
            "width": null
2264
          }
2265
        },
2266
        "fbf6c4c6ed85465095eb3ae986994c69": {
2267
          "model_module": "@jupyter-widgets/controls",
2268
          "model_name": "ProgressStyleModel",
2269
          "model_module_version": "1.5.0",
2270
          "state": {
2271
            "_model_module": "@jupyter-widgets/controls",
2272
            "_model_module_version": "1.5.0",
2273
            "_model_name": "ProgressStyleModel",
2274
            "_view_count": null,
2275
            "_view_module": "@jupyter-widgets/base",
2276
            "_view_module_version": "1.2.0",
2277
            "_view_name": "StyleView",
2278
            "bar_color": null,
2279
            "description_width": ""
2280
          }
2281
        },
2282
        "95addcc750ad45ecbc37c5c7f463d812": {
2283
          "model_module": "@jupyter-widgets/base",
2284
          "model_name": "LayoutModel",
2285
          "model_module_version": "1.2.0",
2286
          "state": {
2287
            "_model_module": "@jupyter-widgets/base",
2288
            "_model_module_version": "1.2.0",
2289
            "_model_name": "LayoutModel",
2290
            "_view_count": null,
2291
            "_view_module": "@jupyter-widgets/base",
2292
            "_view_module_version": "1.2.0",
2293
            "_view_name": "LayoutView",
2294
            "align_content": null,
2295
            "align_items": null,
2296
            "align_self": null,
2297
            "border": null,
2298
            "bottom": null,
2299
            "display": null,
2300
            "flex": null,
2301
            "flex_flow": null,
2302
            "grid_area": null,
2303
            "grid_auto_columns": null,
2304
            "grid_auto_flow": null,
2305
            "grid_auto_rows": null,
2306
            "grid_column": null,
2307
            "grid_gap": null,
2308
            "grid_row": null,
2309
            "grid_template_areas": null,
2310
            "grid_template_columns": null,
2311
            "grid_template_rows": null,
2312
            "height": null,
2313
            "justify_content": null,
2314
            "justify_items": null,
2315
            "left": null,
2316
            "margin": null,
2317
            "max_height": null,
2318
            "max_width": null,
2319
            "min_height": null,
2320
            "min_width": null,
2321
            "object_fit": null,
2322
            "object_position": null,
2323
            "order": null,
2324
            "overflow": null,
2325
            "overflow_x": null,
2326
            "overflow_y": null,
2327
            "padding": null,
2328
            "right": null,
2329
            "top": null,
2330
            "visibility": null,
2331
            "width": null
2332
          }
2333
        },
2334
        "0e8403a6428b4387a1ebbdecf7c7aa03": {
2335
          "model_module": "@jupyter-widgets/controls",
2336
          "model_name": "DescriptionStyleModel",
2337
          "model_module_version": "1.5.0",
2338
          "state": {
2339
            "_model_module": "@jupyter-widgets/controls",
2340
            "_model_module_version": "1.5.0",
2341
            "_model_name": "DescriptionStyleModel",
2342
            "_view_count": null,
2343
            "_view_module": "@jupyter-widgets/base",
2344
            "_view_module_version": "1.2.0",
2345
            "_view_name": "StyleView",
2346
            "description_width": ""
2347
          }
2348
        },
2349
        "945dffb008b44010807bf11ae1dbfec2": {
2350
          "model_module": "@jupyter-widgets/controls",
2351
          "model_name": "HBoxModel",
2352
          "model_module_version": "1.5.0",
2353
          "state": {
2354
            "_dom_classes": [],
2355
            "_model_module": "@jupyter-widgets/controls",
2356
            "_model_module_version": "1.5.0",
2357
            "_model_name": "HBoxModel",
2358
            "_view_count": null,
2359
            "_view_module": "@jupyter-widgets/controls",
2360
            "_view_module_version": "1.5.0",
2361
            "_view_name": "HBoxView",
2362
            "box_style": "",
2363
            "children": [
2364
              "IPY_MODEL_9a28c85b06bc49ce9c36534766b7650f",
2365
              "IPY_MODEL_46964345de59401ab8bc5f51dcfa94fd",
2366
              "IPY_MODEL_60b0f63948dd47fcb6d8aaab5bfedf5c"
2367
            ],
2368
            "layout": "IPY_MODEL_edc938cff4ec477b92ecb768f3ab2fab"
2369
          }
2370
        },
2371
        "9a28c85b06bc49ce9c36534766b7650f": {
2372
          "model_module": "@jupyter-widgets/controls",
2373
          "model_name": "HTMLModel",
2374
          "model_module_version": "1.5.0",
2375
          "state": {
2376
            "_dom_classes": [],
2377
            "_model_module": "@jupyter-widgets/controls",
2378
            "_model_module_version": "1.5.0",
2379
            "_model_name": "HTMLModel",
2380
            "_view_count": null,
2381
            "_view_module": "@jupyter-widgets/controls",
2382
            "_view_module_version": "1.5.0",
2383
            "_view_name": "HTMLView",
2384
            "description": "",
2385
            "description_tooltip": null,
2386
            "layout": "IPY_MODEL_7d3c1a673c614c819f5b83b8d9fb61ef",
2387
            "placeholder": "​",
2388
            "style": "IPY_MODEL_7a8b92bd2ea34c2181f6dcaaea9c5dee",
2389
            "value": "training_args.bin: 100%"
2390
          }
2391
        },
2392
        "46964345de59401ab8bc5f51dcfa94fd": {
2393
          "model_module": "@jupyter-widgets/controls",
2394
          "model_name": "FloatProgressModel",
2395
          "model_module_version": "1.5.0",
2396
          "state": {
2397
            "_dom_classes": [],
2398
            "_model_module": "@jupyter-widgets/controls",
2399
            "_model_module_version": "1.5.0",
2400
            "_model_name": "FloatProgressModel",
2401
            "_view_count": null,
2402
            "_view_module": "@jupyter-widgets/controls",
2403
            "_view_module_version": "1.5.0",
2404
            "_view_name": "ProgressView",
2405
            "bar_style": "success",
2406
            "description": "",
2407
            "description_tooltip": null,
2408
            "layout": "IPY_MODEL_6f83a7cd4e664e8aaf847196344d1256",
2409
            "max": 5435,
2410
            "min": 0,
2411
            "orientation": "horizontal",
2412
            "style": "IPY_MODEL_145c52ca456d4052af8b458578858176",
2413
            "value": 5435
2414
          }
2415
        },
2416
        "60b0f63948dd47fcb6d8aaab5bfedf5c": {
2417
          "model_module": "@jupyter-widgets/controls",
2418
          "model_name": "HTMLModel",
2419
          "model_module_version": "1.5.0",
2420
          "state": {
2421
            "_dom_classes": [],
2422
            "_model_module": "@jupyter-widgets/controls",
2423
            "_model_module_version": "1.5.0",
2424
            "_model_name": "HTMLModel",
2425
            "_view_count": null,
2426
            "_view_module": "@jupyter-widgets/controls",
2427
            "_view_module_version": "1.5.0",
2428
            "_view_name": "HTMLView",
2429
            "description": "",
2430
            "description_tooltip": null,
2431
            "layout": "IPY_MODEL_b3d7552080874350a3688dab8838452c",
2432
            "placeholder": "​",
2433
            "style": "IPY_MODEL_63e84ef3cff94a929602b8b419cd8071",
2434
            "value": " 5.43k/5.43k [00:00&lt;00:00, 8.05kB/s]"
2435
          }
2436
        },
2437
        "edc938cff4ec477b92ecb768f3ab2fab": {
2438
          "model_module": "@jupyter-widgets/base",
2439
          "model_name": "LayoutModel",
2440
          "model_module_version": "1.2.0",
2441
          "state": {
2442
            "_model_module": "@jupyter-widgets/base",
2443
            "_model_module_version": "1.2.0",
2444
            "_model_name": "LayoutModel",
2445
            "_view_count": null,
2446
            "_view_module": "@jupyter-widgets/base",
2447
            "_view_module_version": "1.2.0",
2448
            "_view_name": "LayoutView",
2449
            "align_content": null,
2450
            "align_items": null,
2451
            "align_self": null,
2452
            "border": null,
2453
            "bottom": null,
2454
            "display": null,
2455
            "flex": null,
2456
            "flex_flow": null,
2457
            "grid_area": null,
2458
            "grid_auto_columns": null,
2459
            "grid_auto_flow": null,
2460
            "grid_auto_rows": null,
2461
            "grid_column": null,
2462
            "grid_gap": null,
2463
            "grid_row": null,
2464
            "grid_template_areas": null,
2465
            "grid_template_columns": null,
2466
            "grid_template_rows": null,
2467
            "height": null,
2468
            "justify_content": null,
2469
            "justify_items": null,
2470
            "left": null,
2471
            "margin": null,
2472
            "max_height": null,
2473
            "max_width": null,
2474
            "min_height": null,
2475
            "min_width": null,
2476
            "object_fit": null,
2477
            "object_position": null,
2478
            "order": null,
2479
            "overflow": null,
2480
            "overflow_x": null,
2481
            "overflow_y": null,
2482
            "padding": null,
2483
            "right": null,
2484
            "top": null,
2485
            "visibility": null,
2486
            "width": null
2487
          }
2488
        },
2489
        "7d3c1a673c614c819f5b83b8d9fb61ef": {
2490
          "model_module": "@jupyter-widgets/base",
2491
          "model_name": "LayoutModel",
2492
          "model_module_version": "1.2.0",
2493
          "state": {
2494
            "_model_module": "@jupyter-widgets/base",
2495
            "_model_module_version": "1.2.0",
2496
            "_model_name": "LayoutModel",
2497
            "_view_count": null,
2498
            "_view_module": "@jupyter-widgets/base",
2499
            "_view_module_version": "1.2.0",
2500
            "_view_name": "LayoutView",
2501
            "align_content": null,
2502
            "align_items": null,
2503
            "align_self": null,
2504
            "border": null,
2505
            "bottom": null,
2506
            "display": null,
2507
            "flex": null,
2508
            "flex_flow": null,
2509
            "grid_area": null,
2510
            "grid_auto_columns": null,
2511
            "grid_auto_flow": null,
2512
            "grid_auto_rows": null,
2513
            "grid_column": null,
2514
            "grid_gap": null,
2515
            "grid_row": null,
2516
            "grid_template_areas": null,
2517
            "grid_template_columns": null,
2518
            "grid_template_rows": null,
2519
            "height": null,
2520
            "justify_content": null,
2521
            "justify_items": null,
2522
            "left": null,
2523
            "margin": null,
2524
            "max_height": null,
2525
            "max_width": null,
2526
            "min_height": null,
2527
            "min_width": null,
2528
            "object_fit": null,
2529
            "object_position": null,
2530
            "order": null,
2531
            "overflow": null,
2532
            "overflow_x": null,
2533
            "overflow_y": null,
2534
            "padding": null,
2535
            "right": null,
2536
            "top": null,
2537
            "visibility": null,
2538
            "width": null
2539
          }
2540
        },
2541
        "7a8b92bd2ea34c2181f6dcaaea9c5dee": {
2542
          "model_module": "@jupyter-widgets/controls",
2543
          "model_name": "DescriptionStyleModel",
2544
          "model_module_version": "1.5.0",
2545
          "state": {
2546
            "_model_module": "@jupyter-widgets/controls",
2547
            "_model_module_version": "1.5.0",
2548
            "_model_name": "DescriptionStyleModel",
2549
            "_view_count": null,
2550
            "_view_module": "@jupyter-widgets/base",
2551
            "_view_module_version": "1.2.0",
2552
            "_view_name": "StyleView",
2553
            "description_width": ""
2554
          }
2555
        },
2556
        "6f83a7cd4e664e8aaf847196344d1256": {
2557
          "model_module": "@jupyter-widgets/base",
2558
          "model_name": "LayoutModel",
2559
          "model_module_version": "1.2.0",
2560
          "state": {
2561
            "_model_module": "@jupyter-widgets/base",
2562
            "_model_module_version": "1.2.0",
2563
            "_model_name": "LayoutModel",
2564
            "_view_count": null,
2565
            "_view_module": "@jupyter-widgets/base",
2566
            "_view_module_version": "1.2.0",
2567
            "_view_name": "LayoutView",
2568
            "align_content": null,
2569
            "align_items": null,
2570
            "align_self": null,
2571
            "border": null,
2572
            "bottom": null,
2573
            "display": null,
2574
            "flex": null,
2575
            "flex_flow": null,
2576
            "grid_area": null,
2577
            "grid_auto_columns": null,
2578
            "grid_auto_flow": null,
2579
            "grid_auto_rows": null,
2580
            "grid_column": null,
2581
            "grid_gap": null,
2582
            "grid_row": null,
2583
            "grid_template_areas": null,
2584
            "grid_template_columns": null,
2585
            "grid_template_rows": null,
2586
            "height": null,
2587
            "justify_content": null,
2588
            "justify_items": null,
2589
            "left": null,
2590
            "margin": null,
2591
            "max_height": null,
2592
            "max_width": null,
2593
            "min_height": null,
2594
            "min_width": null,
2595
            "object_fit": null,
2596
            "object_position": null,
2597
            "order": null,
2598
            "overflow": null,
2599
            "overflow_x": null,
2600
            "overflow_y": null,
2601
            "padding": null,
2602
            "right": null,
2603
            "top": null,
2604
            "visibility": null,
2605
            "width": null
2606
          }
2607
        },
2608
        "145c52ca456d4052af8b458578858176": {
2609
          "model_module": "@jupyter-widgets/controls",
2610
          "model_name": "ProgressStyleModel",
2611
          "model_module_version": "1.5.0",
2612
          "state": {
2613
            "_model_module": "@jupyter-widgets/controls",
2614
            "_model_module_version": "1.5.0",
2615
            "_model_name": "ProgressStyleModel",
2616
            "_view_count": null,
2617
            "_view_module": "@jupyter-widgets/base",
2618
            "_view_module_version": "1.2.0",
2619
            "_view_name": "StyleView",
2620
            "bar_color": null,
2621
            "description_width": ""
2622
          }
2623
        },
2624
        "b3d7552080874350a3688dab8838452c": {
2625
          "model_module": "@jupyter-widgets/base",
2626
          "model_name": "LayoutModel",
2627
          "model_module_version": "1.2.0",
2628
          "state": {
2629
            "_model_module": "@jupyter-widgets/base",
2630
            "_model_module_version": "1.2.0",
2631
            "_model_name": "LayoutModel",
2632
            "_view_count": null,
2633
            "_view_module": "@jupyter-widgets/base",
2634
            "_view_module_version": "1.2.0",
2635
            "_view_name": "LayoutView",
2636
            "align_content": null,
2637
            "align_items": null,
2638
            "align_self": null,
2639
            "border": null,
2640
            "bottom": null,
2641
            "display": null,
2642
            "flex": null,
2643
            "flex_flow": null,
2644
            "grid_area": null,
2645
            "grid_auto_columns": null,
2646
            "grid_auto_flow": null,
2647
            "grid_auto_rows": null,
2648
            "grid_column": null,
2649
            "grid_gap": null,
2650
            "grid_row": null,
2651
            "grid_template_areas": null,
2652
            "grid_template_columns": null,
2653
            "grid_template_rows": null,
2654
            "height": null,
2655
            "justify_content": null,
2656
            "justify_items": null,
2657
            "left": null,
2658
            "margin": null,
2659
            "max_height": null,
2660
            "max_width": null,
2661
            "min_height": null,
2662
            "min_width": null,
2663
            "object_fit": null,
2664
            "object_position": null,
2665
            "order": null,
2666
            "overflow": null,
2667
            "overflow_x": null,
2668
            "overflow_y": null,
2669
            "padding": null,
2670
            "right": null,
2671
            "top": null,
2672
            "visibility": null,
2673
            "width": null
2674
          }
2675
        },
2676
        "63e84ef3cff94a929602b8b419cd8071": {
2677
          "model_module": "@jupyter-widgets/controls",
2678
          "model_name": "DescriptionStyleModel",
2679
          "model_module_version": "1.5.0",
2680
          "state": {
2681
            "_model_module": "@jupyter-widgets/controls",
2682
            "_model_module_version": "1.5.0",
2683
            "_model_name": "DescriptionStyleModel",
2684
            "_view_count": null,
2685
            "_view_module": "@jupyter-widgets/base",
2686
            "_view_module_version": "1.2.0",
2687
            "_view_name": "StyleView",
2688
            "description_width": ""
2689
          }
2690
        },
2691
        "55b59177fdb6441ba564d5f3f5dfa422": {
2692
          "model_module": "@jupyter-widgets/controls",
2693
          "model_name": "HBoxModel",
2694
          "model_module_version": "1.5.0",
2695
          "state": {
2696
            "_dom_classes": [],
2697
            "_model_module": "@jupyter-widgets/controls",
2698
            "_model_module_version": "1.5.0",
2699
            "_model_name": "HBoxModel",
2700
            "_view_count": null,
2701
            "_view_module": "@jupyter-widgets/controls",
2702
            "_view_module_version": "1.5.0",
2703
            "_view_name": "HBoxView",
2704
            "box_style": "",
2705
            "children": [
2706
              "IPY_MODEL_52d6cbef58b947119609460d41917399",
2707
              "IPY_MODEL_264f7e06376748dda35453413b382949",
2708
              "IPY_MODEL_1b84d95ea138413d8d8d1ea997741f86"
2709
            ],
2710
            "layout": "IPY_MODEL_8f581db41cd54f89a81f8424042190cf"
2711
          }
2712
        },
2713
        "52d6cbef58b947119609460d41917399": {
2714
          "model_module": "@jupyter-widgets/controls",
2715
          "model_name": "HTMLModel",
2716
          "model_module_version": "1.5.0",
2717
          "state": {
2718
            "_dom_classes": [],
2719
            "_model_module": "@jupyter-widgets/controls",
2720
            "_model_module_version": "1.5.0",
2721
            "_model_name": "HTMLModel",
2722
            "_view_count": null,
2723
            "_view_module": "@jupyter-widgets/controls",
2724
            "_view_module_version": "1.5.0",
2725
            "_view_name": "HTMLView",
2726
            "description": "",
2727
            "description_tooltip": null,
2728
            "layout": "IPY_MODEL_15ca60c283cb4fa389ed92e9433af851",
2729
            "placeholder": "​",
2730
            "style": "IPY_MODEL_ee220712a2e0467a8d07c473749a958c",
2731
            "value": "tokenizer.model: 100%"
2732
          }
2733
        },
2734
        "264f7e06376748dda35453413b382949": {
2735
          "model_module": "@jupyter-widgets/controls",
2736
          "model_name": "FloatProgressModel",
2737
          "model_module_version": "1.5.0",
2738
          "state": {
2739
            "_dom_classes": [],
2740
            "_model_module": "@jupyter-widgets/controls",
2741
            "_model_module_version": "1.5.0",
2742
            "_model_name": "FloatProgressModel",
2743
            "_view_count": null,
2744
            "_view_module": "@jupyter-widgets/controls",
2745
            "_view_module_version": "1.5.0",
2746
            "_view_name": "ProgressView",
2747
            "bar_style": "success",
2748
            "description": "",
2749
            "description_tooltip": null,
2750
            "layout": "IPY_MODEL_689c0aca3273499e820bad016d3ccaa9",
2751
            "max": 493443,
2752
            "min": 0,
2753
            "orientation": "horizontal",
2754
            "style": "IPY_MODEL_a2096f9286ab486e9baad9f349a23a95",
2755
            "value": 493443
2756
          }
2757
        },
2758
        "1b84d95ea138413d8d8d1ea997741f86": {
2759
          "model_module": "@jupyter-widgets/controls",
2760
          "model_name": "HTMLModel",
2761
          "model_module_version": "1.5.0",
2762
          "state": {
2763
            "_dom_classes": [],
2764
            "_model_module": "@jupyter-widgets/controls",
2765
            "_model_module_version": "1.5.0",
2766
            "_model_name": "HTMLModel",
2767
            "_view_count": null,
2768
            "_view_module": "@jupyter-widgets/controls",
2769
            "_view_module_version": "1.5.0",
2770
            "_view_name": "HTMLView",
2771
            "description": "",
2772
            "description_tooltip": null,
2773
            "layout": "IPY_MODEL_1bcc515d9d764c908af2988e29eaeeed",
2774
            "placeholder": "​",
2775
            "style": "IPY_MODEL_ca437b02cab741489217ad4d8780f728",
2776
            "value": " 493k/493k [00:00&lt;00:00, 22.9kB/s]"
2777
          }
2778
        },
2779
        "8f581db41cd54f89a81f8424042190cf": {
2780
          "model_module": "@jupyter-widgets/base",
2781
          "model_name": "LayoutModel",
2782
          "model_module_version": "1.2.0",
2783
          "state": {
2784
            "_model_module": "@jupyter-widgets/base",
2785
            "_model_module_version": "1.2.0",
2786
            "_model_name": "LayoutModel",
2787
            "_view_count": null,
2788
            "_view_module": "@jupyter-widgets/base",
2789
            "_view_module_version": "1.2.0",
2790
            "_view_name": "LayoutView",
2791
            "align_content": null,
2792
            "align_items": null,
2793
            "align_self": null,
2794
            "border": null,
2795
            "bottom": null,
2796
            "display": null,
2797
            "flex": null,
2798
            "flex_flow": null,
2799
            "grid_area": null,
2800
            "grid_auto_columns": null,
2801
            "grid_auto_flow": null,
2802
            "grid_auto_rows": null,
2803
            "grid_column": null,
2804
            "grid_gap": null,
2805
            "grid_row": null,
2806
            "grid_template_areas": null,
2807
            "grid_template_columns": null,
2808
            "grid_template_rows": null,
2809
            "height": null,
2810
            "justify_content": null,
2811
            "justify_items": null,
2812
            "left": null,
2813
            "margin": null,
2814
            "max_height": null,
2815
            "max_width": null,
2816
            "min_height": null,
2817
            "min_width": null,
2818
            "object_fit": null,
2819
            "object_position": null,
2820
            "order": null,
2821
            "overflow": null,
2822
            "overflow_x": null,
2823
            "overflow_y": null,
2824
            "padding": null,
2825
            "right": null,
2826
            "top": null,
2827
            "visibility": null,
2828
            "width": null
2829
          }
2830
        },
2831
        "15ca60c283cb4fa389ed92e9433af851": {
2832
          "model_module": "@jupyter-widgets/base",
2833
          "model_name": "LayoutModel",
2834
          "model_module_version": "1.2.0",
2835
          "state": {
2836
            "_model_module": "@jupyter-widgets/base",
2837
            "_model_module_version": "1.2.0",
2838
            "_model_name": "LayoutModel",
2839
            "_view_count": null,
2840
            "_view_module": "@jupyter-widgets/base",
2841
            "_view_module_version": "1.2.0",
2842
            "_view_name": "LayoutView",
2843
            "align_content": null,
2844
            "align_items": null,
2845
            "align_self": null,
2846
            "border": null,
2847
            "bottom": null,
2848
            "display": null,
2849
            "flex": null,
2850
            "flex_flow": null,
2851
            "grid_area": null,
2852
            "grid_auto_columns": null,
2853
            "grid_auto_flow": null,
2854
            "grid_auto_rows": null,
2855
            "grid_column": null,
2856
            "grid_gap": null,
2857
            "grid_row": null,
2858
            "grid_template_areas": null,
2859
            "grid_template_columns": null,
2860
            "grid_template_rows": null,
2861
            "height": null,
2862
            "justify_content": null,
2863
            "justify_items": null,
2864
            "left": null,
2865
            "margin": null,
2866
            "max_height": null,
2867
            "max_width": null,
2868
            "min_height": null,
2869
            "min_width": null,
2870
            "object_fit": null,
2871
            "object_position": null,
2872
            "order": null,
2873
            "overflow": null,
2874
            "overflow_x": null,
2875
            "overflow_y": null,
2876
            "padding": null,
2877
            "right": null,
2878
            "top": null,
2879
            "visibility": null,
2880
            "width": null
2881
          }
2882
        },
2883
        "ee220712a2e0467a8d07c473749a958c": {
2884
          "model_module": "@jupyter-widgets/controls",
2885
          "model_name": "DescriptionStyleModel",
2886
          "model_module_version": "1.5.0",
2887
          "state": {
2888
            "_model_module": "@jupyter-widgets/controls",
2889
            "_model_module_version": "1.5.0",
2890
            "_model_name": "DescriptionStyleModel",
2891
            "_view_count": null,
2892
            "_view_module": "@jupyter-widgets/base",
2893
            "_view_module_version": "1.2.0",
2894
            "_view_name": "StyleView",
2895
            "description_width": ""
2896
          }
2897
        },
2898
        "689c0aca3273499e820bad016d3ccaa9": {
2899
          "model_module": "@jupyter-widgets/base",
2900
          "model_name": "LayoutModel",
2901
          "model_module_version": "1.2.0",
2902
          "state": {
2903
            "_model_module": "@jupyter-widgets/base",
2904
            "_model_module_version": "1.2.0",
2905
            "_model_name": "LayoutModel",
2906
            "_view_count": null,
2907
            "_view_module": "@jupyter-widgets/base",
2908
            "_view_module_version": "1.2.0",
2909
            "_view_name": "LayoutView",
2910
            "align_content": null,
2911
            "align_items": null,
2912
            "align_self": null,
2913
            "border": null,
2914
            "bottom": null,
2915
            "display": null,
2916
            "flex": null,
2917
            "flex_flow": null,
2918
            "grid_area": null,
2919
            "grid_auto_columns": null,
2920
            "grid_auto_flow": null,
2921
            "grid_auto_rows": null,
2922
            "grid_column": null,
2923
            "grid_gap": null,
2924
            "grid_row": null,
2925
            "grid_template_areas": null,
2926
            "grid_template_columns": null,
2927
            "grid_template_rows": null,
2928
            "height": null,
2929
            "justify_content": null,
2930
            "justify_items": null,
2931
            "left": null,
2932
            "margin": null,
2933
            "max_height": null,
2934
            "max_width": null,
2935
            "min_height": null,
2936
            "min_width": null,
2937
            "object_fit": null,
2938
            "object_position": null,
2939
            "order": null,
2940
            "overflow": null,
2941
            "overflow_x": null,
2942
            "overflow_y": null,
2943
            "padding": null,
2944
            "right": null,
2945
            "top": null,
2946
            "visibility": null,
2947
            "width": null
2948
          }
2949
        },
2950
        "a2096f9286ab486e9baad9f349a23a95": {
2951
          "model_module": "@jupyter-widgets/controls",
2952
          "model_name": "ProgressStyleModel",
2953
          "model_module_version": "1.5.0",
2954
          "state": {
2955
            "_model_module": "@jupyter-widgets/controls",
2956
            "_model_module_version": "1.5.0",
2957
            "_model_name": "ProgressStyleModel",
2958
            "_view_count": null,
2959
            "_view_module": "@jupyter-widgets/base",
2960
            "_view_module_version": "1.2.0",
2961
            "_view_name": "StyleView",
2962
            "bar_color": null,
2963
            "description_width": ""
2964
          }
2965
        },
2966
        "1bcc515d9d764c908af2988e29eaeeed": {
2967
          "model_module": "@jupyter-widgets/base",
2968
          "model_name": "LayoutModel",
2969
          "model_module_version": "1.2.0",
2970
          "state": {
2971
            "_model_module": "@jupyter-widgets/base",
2972
            "_model_module_version": "1.2.0",
2973
            "_model_name": "LayoutModel",
2974
            "_view_count": null,
2975
            "_view_module": "@jupyter-widgets/base",
2976
            "_view_module_version": "1.2.0",
2977
            "_view_name": "LayoutView",
2978
            "align_content": null,
2979
            "align_items": null,
2980
            "align_self": null,
2981
            "border": null,
2982
            "bottom": null,
2983
            "display": null,
2984
            "flex": null,
2985
            "flex_flow": null,
2986
            "grid_area": null,
2987
            "grid_auto_columns": null,
2988
            "grid_auto_flow": null,
2989
            "grid_auto_rows": null,
2990
            "grid_column": null,
2991
            "grid_gap": null,
2992
            "grid_row": null,
2993
            "grid_template_areas": null,
2994
            "grid_template_columns": null,
2995
            "grid_template_rows": null,
2996
            "height": null,
2997
            "justify_content": null,
2998
            "justify_items": null,
2999
            "left": null,
3000
            "margin": null,
3001
            "max_height": null,
3002
            "max_width": null,
3003
            "min_height": null,
3004
            "min_width": null,
3005
            "object_fit": null,
3006
            "object_position": null,
3007
            "order": null,
3008
            "overflow": null,
3009
            "overflow_x": null,
3010
            "overflow_y": null,
3011
            "padding": null,
3012
            "right": null,
3013
            "top": null,
3014
            "visibility": null,
3015
            "width": null
3016
          }
3017
        },
3018
        "ca437b02cab741489217ad4d8780f728": {
3019
          "model_module": "@jupyter-widgets/controls",
3020
          "model_name": "DescriptionStyleModel",
3021
          "model_module_version": "1.5.0",
3022
          "state": {
3023
            "_model_module": "@jupyter-widgets/controls",
3024
            "_model_module_version": "1.5.0",
3025
            "_model_name": "DescriptionStyleModel",
3026
            "_view_count": null,
3027
            "_view_module": "@jupyter-widgets/base",
3028
            "_view_module_version": "1.2.0",
3029
            "_view_name": "StyleView",
3030
            "description_width": ""
3031
          }
3032
        }
3033
      }
3034
    }
3035
  },
3036
  "cells": [
3037
    {
3038
      "cell_type": "markdown",
3039
      "metadata": {
3040
        "id": "view-in-github",
3041
        "colab_type": "text"
3042
      },
3043
      "source": [
3044
        "<a href=\"https://colab.research.google.com/github/mlabonne/llm-course/blob/main/Quantize_models_with_ExLlamaV2.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
3045
      ]
3046
    },
3047
    {
3048
      "cell_type": "markdown",
3049
      "source": [
3050
        "# ExLlamaV2: The Fastest Library to Run LLMs\n",
3051
        "\n",
3052
        "❤️ Created by [@maximelabonne](https://twitter.com/maximelabonne) as part of the 🗣️ [Large Language Model Course](https://github.com/mlabonne/llm-course)."
3053
      ],
3054
      "metadata": {
3055
        "id": "QzUdY6GPiZXG"
3056
      }
3057
    },
3058
    {
3059
      "cell_type": "code",
3060
      "execution_count": null,
3061
      "metadata": {
3062
        "id": "4niZ8igkiXZb"
3063
      },
3064
      "outputs": [],
3065
      "source": [
3066
        "# Install ExLLamaV2\n",
3067
        "!git clone https://github.com/turboderp/exllamav2\n",
3068
        "!pip install -e exllamav2"
3069
      ]
3070
    },
3071
    {
3072
      "cell_type": "code",
3073
      "source": [
3074
        "MODEL_NAME = \"zephyr-7b-beta\"\n",
3075
        "BPW = 5.0\n",
3076
        "\n",
3077
        "# Download model\n",
3078
        "!git lfs install\n",
3079
        "!git clone https://huggingface.co/HuggingFaceH4/{MODEL_NAME}\n",
3080
        "!mv {MODEL_NAME} base_model\n",
3081
        "!rm base_mode/*.bin\n",
3082
        "\n",
3083
        "# Download dataset\n",
3084
        "!wget https://huggingface.co/datasets/wikitext/resolve/9a9e482b5987f9d25b3a9b2883fc6cc9fd8071b3/wikitext-103-v1/wikitext-test.parquet"
3085
      ],
3086
      "metadata": {
3087
        "colab": {
3088
          "base_uri": "https://localhost:8080/"
3089
        },
3090
        "id": "elHDPmXAil0c",
3091
        "outputId": "5b732dac-fead-4ab2-f3e8-7b3622d3c690"
3092
      },
3093
      "execution_count": null,
3094
      "outputs": [
3095
        {
3096
          "output_type": "stream",
3097
          "name": "stdout",
3098
          "text": [
3099
            "Git LFS initialized.\n",
3100
            "Cloning into 'zephyr-7b-beta'...\n",
3101
            "remote: Enumerating objects: 55, done.\u001b[K\n",
3102
            "remote: Total 55 (delta 0), reused 0 (delta 0), pack-reused 55\u001b[K\n",
3103
            "Unpacking objects: 100% (55/55), 534.67 KiB | 4.73 MiB/s, done.\n",
3104
            "Filtering content: 100% (10/10), 13.48 GiB | 129.35 MiB/s, done.\n",
3105
            "rm: cannot remove 'base_mode/*.bin': No such file or directory\n",
3106
            "--2023-11-03 18:05:02--  https://huggingface.co/datasets/wikitext/resolve/9a9e482b5987f9d25b3a9b2883fc6cc9fd8071b3/wikitext-103-v1/wikitext-test.parquet\n",
3107
            "Resolving huggingface.co (huggingface.co)... 65.8.178.27, 65.8.178.93, 65.8.178.118, ...\n",
3108
            "Connecting to huggingface.co (huggingface.co)|65.8.178.27|:443... connected.\n",
3109
            "HTTP request sent, awaiting response... 200 OK\n",
3110
            "Length: 721735 (705K)\n",
3111
            "Saving to: ‘wikitext-test.parquet’\n",
3112
            "\n",
3113
            "wikitext-test.parqu 100%[===================>] 704.82K  --.-KB/s    in 0.1s    \n",
3114
            "\n",
3115
            "2023-11-03 18:05:02 (5.57 MB/s) - ‘wikitext-test.parquet’ saved [721735/721735]\n",
3116
            "\n"
3117
          ]
3118
        }
3119
      ]
3120
    },
3121
    {
3122
      "cell_type": "code",
3123
      "source": [
3124
        "# Quantize model\n",
3125
        "!mkdir quant\n",
3126
        "!python exllamav2/convert.py \\\n",
3127
        "    -i base_model \\\n",
3128
        "    -o quant \\\n",
3129
        "    -c wikitext-test.parquet \\\n",
3130
        "    -b {BPW}"
3131
      ],
3132
      "metadata": {
3133
        "colab": {
3134
          "base_uri": "https://localhost:8080/"
3135
        },
3136
        "id": "jigQLg8Fis1f",
3137
        "outputId": "5f2e97ee-f823-45f7-f39a-f4c6a774b587"
3138
      },
3139
      "execution_count": null,
3140
      "outputs": [
3141
        {
3142
          "output_type": "stream",
3143
          "name": "stdout",
3144
          "text": [
3145
            "\u001b[1;30;43mStreaming output truncated to the last 5000 lines.\u001b[0m\n",
3146
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01444\n",
3147
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01401\n",
3148
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01332\n",
3149
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00876\n",
3150
            " -- Time: 3.78 seconds\n",
3151
            " -- Linear: model.layers.7.self_attn.o_proj\n",
3152
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.19280\n",
3153
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.17356\n",
3154
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.16492\n",
3155
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14247\n",
3156
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09048\n",
3157
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08221\n",
3158
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10930\n",
3159
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09792\n",
3160
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09219\n",
3161
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07561\n",
3162
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07156\n",
3163
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05653\n",
3164
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04767\n",
3165
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04434\n",
3166
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04352\n",
3167
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02850\n",
3168
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02416\n",
3169
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02348\n",
3170
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02138\n",
3171
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02088\n",
3172
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01587\n",
3173
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01675\n",
3174
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01480\n",
3175
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01294\n",
3176
            " -- Time: 6.21 seconds\n",
3177
            " -- Layer: model.layers.7 (MLP)\n",
3178
            " -- Linear: model.layers.7.mlp.gate_proj\n",
3179
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.17192\n",
3180
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16163\n",
3181
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15815\n",
3182
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14380\n",
3183
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08135\n",
3184
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07770\n",
3185
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09087\n",
3186
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08363\n",
3187
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08210\n",
3188
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07280\n",
3189
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06958\n",
3190
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04646\n",
3191
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04014\n",
3192
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03912\n",
3193
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03888\n",
3194
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02327\n",
3195
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02036\n",
3196
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02012\n",
3197
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01866\n",
3198
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01851\n",
3199
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01246\n",
3200
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01264\n",
3201
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01212\n",
3202
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00882\n",
3203
            " -- Time: 16.78 seconds\n",
3204
            " -- Linear: model.layers.7.mlp.up_proj\n",
3205
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.24041\n",
3206
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22653\n",
3207
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.22191\n",
3208
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.20179\n",
3209
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11401\n",
3210
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10911\n",
3211
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12697\n",
3212
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11680\n",
3213
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11501\n",
3214
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10219\n",
3215
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09774\n",
3216
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06494\n",
3217
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05600\n",
3218
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05474\n",
3219
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05444\n",
3220
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03253\n",
3221
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02831\n",
3222
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02799\n",
3223
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02593\n",
3224
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02574\n",
3225
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01738\n",
3226
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01727\n",
3227
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01695\n",
3228
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01176\n",
3229
            " -- Time: 16.71 seconds\n",
3230
            " -- Linear: model.layers.7.mlp.down_proj\n",
3231
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.20930\n",
3232
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18827\n",
3233
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17987\n",
3234
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16126\n",
3235
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09629\n",
3236
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.08799\n",
3237
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11395\n",
3238
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10350\n",
3239
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.09877\n",
3240
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08309\n",
3241
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07956\n",
3242
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05813\n",
3243
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04962\n",
3244
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04637\n",
3245
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04557\n",
3246
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02919\n",
3247
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02440\n",
3248
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02402\n",
3249
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02185\n",
3250
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02135\n",
3251
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01579\n",
3252
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01587\n",
3253
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01471\n",
3254
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01128\n",
3255
            " -- Time: 26.80 seconds\n",
3256
            " -- Layer: model.layers.8 (Attention)\n",
3257
            " -- Linear: model.layers.8.self_attn.q_proj\n",
3258
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.07321\n",
3259
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.06490\n",
3260
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.05988\n",
3261
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.05294\n",
3262
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.03374\n",
3263
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.02962\n",
3264
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.04266\n",
3265
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.03904\n",
3266
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.03463\n",
3267
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.02839\n",
3268
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.02717\n",
3269
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02166\n",
3270
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.01866\n",
3271
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.01627\n",
3272
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01567\n",
3273
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01085\n",
3274
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.00853\n",
3275
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00809\n",
3276
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00748\n",
3277
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00708\n",
3278
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00570\n",
3279
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00571\n",
3280
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00489\n",
3281
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00384\n",
3282
            " -- Time: 6.22 seconds\n",
3283
            " -- Linear: model.layers.8.self_attn.k_proj\n",
3284
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.06478\n",
3285
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.05636\n",
3286
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.05113\n",
3287
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.04496\n",
3288
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.02945\n",
3289
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.02518\n",
3290
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.03836\n",
3291
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.03491\n",
3292
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.03047\n",
3293
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.02440\n",
3294
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.02347\n",
3295
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.01943\n",
3296
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.01666\n",
3297
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.01420\n",
3298
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01356\n",
3299
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.00974\n",
3300
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.00741\n",
3301
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00695\n",
3302
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00641\n",
3303
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00598\n",
3304
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00506\n",
3305
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00499\n",
3306
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00419\n",
3307
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00326\n",
3308
            " -- Time: 3.87 seconds\n",
3309
            " -- Linear: model.layers.8.self_attn.v_proj\n",
3310
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.18482\n",
3311
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16487\n",
3312
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15686\n",
3313
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13830\n",
3314
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08576\n",
3315
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07784\n",
3316
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10130\n",
3317
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09213\n",
3318
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08768\n",
3319
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07196\n",
3320
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06795\n",
3321
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05156\n",
3322
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04405\n",
3323
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04111\n",
3324
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04040\n",
3325
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02577\n",
3326
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02116\n",
3327
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02051\n",
3328
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01835\n",
3329
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01788\n",
3330
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01333\n",
3331
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01308\n",
3332
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01217\n",
3333
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00845\n",
3334
            " -- Time: 3.83 seconds\n",
3335
            " -- Linear: model.layers.8.self_attn.o_proj\n",
3336
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.20113\n",
3337
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18273\n",
3338
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17538\n",
3339
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15457\n",
3340
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09416\n",
3341
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08692\n",
3342
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11035\n",
3343
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10015\n",
3344
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09581\n",
3345
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08035\n",
3346
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07590\n",
3347
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05670\n",
3348
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04819\n",
3349
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04548\n",
3350
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04482\n",
3351
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02840\n",
3352
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02389\n",
3353
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02333\n",
3354
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02116\n",
3355
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02074\n",
3356
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01511\n",
3357
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01540\n",
3358
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01422\n",
3359
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01094\n",
3360
            " -- Time: 6.22 seconds\n",
3361
            " -- Layer: model.layers.8 (MLP)\n",
3362
            " -- Linear: model.layers.8.mlp.gate_proj\n",
3363
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.16797\n",
3364
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15806\n",
3365
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15463\n",
3366
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14046\n",
3367
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07949\n",
3368
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07596\n",
3369
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08895\n",
3370
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08186\n",
3371
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08023\n",
3372
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07119\n",
3373
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06813\n",
3374
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04545\n",
3375
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03924\n",
3376
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03820\n",
3377
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03795\n",
3378
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02274\n",
3379
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01983\n",
3380
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01959\n",
3381
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01817\n",
3382
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01801\n",
3383
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01210\n",
3384
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01225\n",
3385
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01176\n",
3386
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00845\n",
3387
            " -- Time: 16.76 seconds\n",
3388
            " -- Linear: model.layers.8.mlp.up_proj\n",
3389
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23683\n",
3390
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22306\n",
3391
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21845\n",
3392
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19867\n",
3393
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11225\n",
3394
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10738\n",
3395
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12523\n",
3396
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11508\n",
3397
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11321\n",
3398
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10052\n",
3399
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09621\n",
3400
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06397\n",
3401
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05514\n",
3402
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05385\n",
3403
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05353\n",
3404
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03199\n",
3405
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02772\n",
3406
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02740\n",
3407
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02534\n",
3408
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02515\n",
3409
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01690\n",
3410
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01674\n",
3411
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01646\n",
3412
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01114\n",
3413
            " -- Time: 16.72 seconds\n",
3414
            " -- Linear: model.layers.8.mlp.down_proj\n",
3415
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.21367\n",
3416
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19327\n",
3417
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18532\n",
3418
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16520\n",
3419
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09845\n",
3420
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09059\n",
3421
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11554\n",
3422
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10506\n",
3423
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10081\n",
3424
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08507\n",
3425
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08090\n",
3426
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05900\n",
3427
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05049\n",
3428
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04752\n",
3429
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04679\n",
3430
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02977\n",
3431
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02519\n",
3432
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02484\n",
3433
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02262\n",
3434
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02216\n",
3435
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01638\n",
3436
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01655\n",
3437
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01541\n",
3438
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01205\n",
3439
            " -- Time: 26.78 seconds\n",
3440
            " -- Layer: model.layers.9 (Attention)\n",
3441
            " -- Linear: model.layers.9.self_attn.q_proj\n",
3442
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09374\n",
3443
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.08343\n",
3444
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07735\n",
3445
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06843\n",
3446
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04327\n",
3447
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03822\n",
3448
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05469\n",
3449
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.04960\n",
3450
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04431\n",
3451
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03654\n",
3452
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03500\n",
3453
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02782\n",
3454
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02380\n",
3455
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02096\n",
3456
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02024\n",
3457
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01396\n",
3458
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01116\n",
3459
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01065\n",
3460
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00987\n",
3461
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00942\n",
3462
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00745\n",
3463
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00763\n",
3464
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00645\n",
3465
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00545\n",
3466
            " -- Time: 6.22 seconds\n",
3467
            " -- Linear: model.layers.9.self_attn.k_proj\n",
3468
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.08149\n",
3469
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.07163\n",
3470
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.06561\n",
3471
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.05786\n",
3472
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.03729\n",
3473
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03228\n",
3474
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.04811\n",
3475
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.04369\n",
3476
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.03838\n",
3477
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03122\n",
3478
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03000\n",
3479
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02446\n",
3480
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02089\n",
3481
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.01795\n",
3482
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01722\n",
3483
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01224\n",
3484
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.00937\n",
3485
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00884\n",
3486
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00818\n",
3487
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00768\n",
3488
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00637\n",
3489
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00628\n",
3490
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00533\n",
3491
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00413\n",
3492
            " -- Time: 3.79 seconds\n",
3493
            " -- Linear: model.layers.9.self_attn.v_proj\n",
3494
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.19517\n",
3495
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.17711\n",
3496
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17032\n",
3497
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15017\n",
3498
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09130\n",
3499
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08444\n",
3500
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10496\n",
3501
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09629\n",
3502
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09271\n",
3503
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07744\n",
3504
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07277\n",
3505
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05330\n",
3506
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04590\n",
3507
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04365\n",
3508
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04312\n",
3509
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02659\n",
3510
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02217\n",
3511
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02165\n",
3512
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01932\n",
3513
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01895\n",
3514
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01363\n",
3515
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01317\n",
3516
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01279\n",
3517
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00804\n",
3518
            " -- Time: 3.80 seconds\n",
3519
            " -- Linear: model.layers.9.self_attn.o_proj\n",
3520
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.20153\n",
3521
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18239\n",
3522
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17453\n",
3523
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15316\n",
3524
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09457\n",
3525
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08706\n",
3526
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11063\n",
3527
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10074\n",
3528
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09616\n",
3529
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07951\n",
3530
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07566\n",
3531
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05678\n",
3532
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04841\n",
3533
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04560\n",
3534
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04491\n",
3535
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02841\n",
3536
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02377\n",
3537
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02318\n",
3538
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02077\n",
3539
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02032\n",
3540
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01498\n",
3541
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01511\n",
3542
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01403\n",
3543
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01042\n",
3544
            " -- Time: 6.20 seconds\n",
3545
            " -- Layer: model.layers.9 (MLP)\n",
3546
            " -- Linear: model.layers.9.mlp.gate_proj\n",
3547
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.16709\n",
3548
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15677\n",
3549
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15316\n",
3550
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13897\n",
3551
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07902\n",
3552
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07526\n",
3553
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08855\n",
3554
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08146\n",
3555
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07979\n",
3556
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07048\n",
3557
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06740\n",
3558
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04528\n",
3559
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03912\n",
3560
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03803\n",
3561
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03776\n",
3562
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02269\n",
3563
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01986\n",
3564
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01961\n",
3565
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01817\n",
3566
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01801\n",
3567
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01216\n",
3568
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01244\n",
3569
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01179\n",
3570
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00879\n",
3571
            " -- Time: 16.77 seconds\n",
3572
            " -- Linear: model.layers.9.mlp.up_proj\n",
3573
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23248\n",
3574
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21835\n",
3575
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21353\n",
3576
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19385\n",
3577
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10999\n",
3578
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10496\n",
3579
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12290\n",
3580
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11303\n",
3581
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11108\n",
3582
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09819\n",
3583
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09389\n",
3584
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06283\n",
3585
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05418\n",
3586
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05282\n",
3587
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05250\n",
3588
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03146\n",
3589
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02733\n",
3590
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02699\n",
3591
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02495\n",
3592
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02474\n",
3593
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01676\n",
3594
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01671\n",
3595
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01630\n",
3596
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01137\n",
3597
            " -- Time: 16.69 seconds\n",
3598
            " -- Linear: model.layers.9.mlp.down_proj\n",
3599
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.22017\n",
3600
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19862\n",
3601
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19033\n",
3602
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16911\n",
3603
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10144\n",
3604
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09320\n",
3605
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11938\n",
3606
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10841\n",
3607
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10391\n",
3608
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08730\n",
3609
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08272\n",
3610
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06067\n",
3611
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05196\n",
3612
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04883\n",
3613
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04807\n",
3614
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03050\n",
3615
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02563\n",
3616
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02526\n",
3617
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02287\n",
3618
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02239\n",
3619
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01654\n",
3620
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01652\n",
3621
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01550\n",
3622
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01166\n",
3623
            " -- Time: 26.75 seconds\n",
3624
            " -- Layer: model.layers.10 (Attention)\n",
3625
            " -- Linear: model.layers.10.self_attn.q_proj\n",
3626
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.08235\n",
3627
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.07363\n",
3628
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.06866\n",
3629
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06023\n",
3630
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.03814\n",
3631
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03398\n",
3632
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.04728\n",
3633
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.04319\n",
3634
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.03894\n",
3635
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03206\n",
3636
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03048\n",
3637
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02402\n",
3638
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02064\n",
3639
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.01838\n",
3640
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01782\n",
3641
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01202\n",
3642
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.00962\n",
3643
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00919\n",
3644
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00842\n",
3645
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00805\n",
3646
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00633\n",
3647
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00634\n",
3648
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00553\n",
3649
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00428\n",
3650
            " -- Time: 6.20 seconds\n",
3651
            " -- Linear: model.layers.10.self_attn.k_proj\n",
3652
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.07516\n",
3653
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.06653\n",
3654
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.06168\n",
3655
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.05393\n",
3656
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.03452\n",
3657
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03046\n",
3658
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.04334\n",
3659
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.03936\n",
3660
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.03536\n",
3661
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.02875\n",
3662
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.02734\n",
3663
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02195\n",
3664
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.01879\n",
3665
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.01658\n",
3666
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01603\n",
3667
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01097\n",
3668
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.00858\n",
3669
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00817\n",
3670
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00742\n",
3671
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00705\n",
3672
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00568\n",
3673
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00556\n",
3674
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00487\n",
3675
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00357\n",
3676
            " -- Time: 3.77 seconds\n",
3677
            " -- Linear: model.layers.10.self_attn.v_proj\n",
3678
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.18187\n",
3679
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16366\n",
3680
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15689\n",
3681
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13720\n",
3682
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08496\n",
3683
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07789\n",
3684
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09894\n",
3685
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08995\n",
3686
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08648\n",
3687
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07118\n",
3688
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06690\n",
3689
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05035\n",
3690
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04296\n",
3691
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04066\n",
3692
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04012\n",
3693
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02514\n",
3694
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02081\n",
3695
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02025\n",
3696
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01800\n",
3697
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01762\n",
3698
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01297\n",
3699
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01259\n",
3700
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01205\n",
3701
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00796\n",
3702
            " -- Time: 3.83 seconds\n",
3703
            " -- Linear: model.layers.10.self_attn.o_proj\n",
3704
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.19772\n",
3705
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.17857\n",
3706
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17053\n",
3707
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14967\n",
3708
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09223\n",
3709
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08466\n",
3710
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10913\n",
3711
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09919\n",
3712
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09394\n",
3713
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07816\n",
3714
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07389\n",
3715
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05624\n",
3716
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04783\n",
3717
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04464\n",
3718
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04390\n",
3719
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02824\n",
3720
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02368\n",
3721
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02304\n",
3722
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02093\n",
3723
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02045\n",
3724
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01527\n",
3725
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01561\n",
3726
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01425\n",
3727
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01133\n",
3728
            " -- Time: 6.18 seconds\n",
3729
            " -- Layer: model.layers.10 (MLP)\n",
3730
            " -- Linear: model.layers.10.mlp.gate_proj\n",
3731
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.16458\n",
3732
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15345\n",
3733
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.14950\n",
3734
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13525\n",
3735
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07763\n",
3736
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07360\n",
3737
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08755\n",
3738
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08045\n",
3739
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07854\n",
3740
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06883\n",
3741
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06571\n",
3742
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04474\n",
3743
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03864\n",
3744
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03735\n",
3745
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03705\n",
3746
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02242\n",
3747
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01952\n",
3748
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01924\n",
3749
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01778\n",
3750
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01760\n",
3751
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01199\n",
3752
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01228\n",
3753
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01155\n",
3754
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00867\n",
3755
            " -- Time: 16.72 seconds\n",
3756
            " -- Linear: model.layers.10.mlp.up_proj\n",
3757
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22519\n",
3758
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21022\n",
3759
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20510\n",
3760
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18548\n",
3761
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10629\n",
3762
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10090\n",
3763
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11927\n",
3764
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10970\n",
3765
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10747\n",
3766
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09419\n",
3767
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08985\n",
3768
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06086\n",
3769
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05254\n",
3770
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05097\n",
3771
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05060\n",
3772
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03043\n",
3773
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02627\n",
3774
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02590\n",
3775
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02382\n",
3776
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02359\n",
3777
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01601\n",
3778
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01597\n",
3779
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01546\n",
3780
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01065\n",
3781
            " -- Time: 16.67 seconds\n",
3782
            " -- Linear: model.layers.10.mlp.down_proj\n",
3783
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.23070\n",
3784
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20868\n",
3785
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20041\n",
3786
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17776\n",
3787
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10675\n",
3788
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09841\n",
3789
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12502\n",
3790
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11343\n",
3791
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10921\n",
3792
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09194\n",
3793
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08704\n",
3794
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06390\n",
3795
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05452\n",
3796
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05149\n",
3797
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.05076\n",
3798
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03217\n",
3799
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02720\n",
3800
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02684\n",
3801
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02433\n",
3802
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02387\n",
3803
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01749\n",
3804
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01771\n",
3805
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01646\n",
3806
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01279\n",
3807
            " -- Time: 26.77 seconds\n",
3808
            " -- Layer: model.layers.11 (Attention)\n",
3809
            " -- Linear: model.layers.11.self_attn.q_proj\n",
3810
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09637\n",
3811
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.08586\n",
3812
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08008\n",
3813
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07014\n",
3814
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04477\n",
3815
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03986\n",
3816
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05541\n",
3817
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05047\n",
3818
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04572\n",
3819
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03744\n",
3820
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03559\n",
3821
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02819\n",
3822
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02421\n",
3823
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02166\n",
3824
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02103\n",
3825
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01414\n",
3826
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01146\n",
3827
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01098\n",
3828
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01004\n",
3829
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00963\n",
3830
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00750\n",
3831
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00769\n",
3832
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00661\n",
3833
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00542\n",
3834
            " -- Time: 6.22 seconds\n",
3835
            " -- Linear: model.layers.11.self_attn.k_proj\n",
3836
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.08114\n",
3837
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.07195\n",
3838
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.06606\n",
3839
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.05768\n",
3840
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.03737\n",
3841
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03267\n",
3842
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.04767\n",
3843
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.04342\n",
3844
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.03824\n",
3845
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03114\n",
3846
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.02972\n",
3847
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02425\n",
3848
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02075\n",
3849
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.01802\n",
3850
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01732\n",
3851
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01210\n",
3852
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.00943\n",
3853
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00893\n",
3854
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00821\n",
3855
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00775\n",
3856
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00635\n",
3857
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00631\n",
3858
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00541\n",
3859
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00423\n",
3860
            " -- Time: 3.82 seconds\n",
3861
            " -- Linear: model.layers.11.self_attn.v_proj\n",
3862
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.19703\n",
3863
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.17551\n",
3864
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.16728\n",
3865
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14535\n",
3866
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09159\n",
3867
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08328\n",
3868
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10811\n",
3869
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09762\n",
3870
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09342\n",
3871
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07590\n",
3872
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07111\n",
3873
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05511\n",
3874
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04670\n",
3875
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04391\n",
3876
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04323\n",
3877
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02758\n",
3878
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02246\n",
3879
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02183\n",
3880
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01924\n",
3881
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01879\n",
3882
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01423\n",
3883
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01368\n",
3884
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01300\n",
3885
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00864\n",
3886
            " -- Time: 3.92 seconds\n",
3887
            " -- Linear: model.layers.11.self_attn.o_proj\n",
3888
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.19597\n",
3889
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.17847\n",
3890
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.16379\n",
3891
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14511\n",
3892
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09237\n",
3893
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08126\n",
3894
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12329\n",
3895
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11030\n",
3896
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09394\n",
3897
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07962\n",
3898
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07759\n",
3899
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06377\n",
3900
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05341\n",
3901
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04512\n",
3902
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04298\n",
3903
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03193\n",
3904
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02434\n",
3905
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02296\n",
3906
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02192\n",
3907
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02058\n",
3908
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01710\n",
3909
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01736\n",
3910
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01424\n",
3911
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01256\n",
3912
            " -- Time: 6.20 seconds\n",
3913
            " -- Layer: model.layers.11 (MLP)\n",
3914
            " -- Linear: model.layers.11.mlp.gate_proj\n",
3915
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.16838\n",
3916
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15674\n",
3917
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15241\n",
3918
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13774\n",
3919
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07955\n",
3920
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07520\n",
3921
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09017\n",
3922
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08269\n",
3923
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08051\n",
3924
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07030\n",
3925
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06713\n",
3926
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04617\n",
3927
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03980\n",
3928
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03838\n",
3929
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03804\n",
3930
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02317\n",
3931
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02025\n",
3932
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01994\n",
3933
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01844\n",
3934
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01824\n",
3935
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01252\n",
3936
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01300\n",
3937
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01203\n",
3938
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00944\n",
3939
            " -- Time: 16.79 seconds\n",
3940
            " -- Linear: model.layers.11.mlp.up_proj\n",
3941
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22740\n",
3942
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21181\n",
3943
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20640\n",
3944
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18641\n",
3945
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10722\n",
3946
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10159\n",
3947
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12081\n",
3948
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11093\n",
3949
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10846\n",
3950
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09479\n",
3951
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09032\n",
3952
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06150\n",
3953
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05311\n",
3954
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05143\n",
3955
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05102\n",
3956
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03077\n",
3957
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02649\n",
3958
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02609\n",
3959
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02397\n",
3960
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02371\n",
3961
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01611\n",
3962
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01609\n",
3963
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01551\n",
3964
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01069\n",
3965
            " -- Time: 16.77 seconds\n",
3966
            " -- Linear: model.layers.11.mlp.down_proj\n",
3967
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.22960\n",
3968
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20772\n",
3969
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19942\n",
3970
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17705\n",
3971
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10644\n",
3972
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09805\n",
3973
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12519\n",
3974
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11322\n",
3975
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10894\n",
3976
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09175\n",
3977
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08694\n",
3978
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06400\n",
3979
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05447\n",
3980
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05138\n",
3981
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.05062\n",
3982
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03219\n",
3983
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02714\n",
3984
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02677\n",
3985
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02429\n",
3986
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02381\n",
3987
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01739\n",
3988
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01767\n",
3989
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01632\n",
3990
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01276\n",
3991
            " -- Time: 26.84 seconds\n",
3992
            " -- Layer: model.layers.12 (Attention)\n",
3993
            " -- Linear: model.layers.12.self_attn.q_proj\n",
3994
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.10068\n",
3995
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.08938\n",
3996
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08243\n",
3997
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07225\n",
3998
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04673\n",
3999
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04101\n",
4000
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06037\n",
4001
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05396\n",
4002
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04786\n",
4003
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03913\n",
4004
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03765\n",
4005
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03088\n",
4006
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02602\n",
4007
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02269\n",
4008
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02185\n",
4009
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01557\n",
4010
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01216\n",
4011
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01156\n",
4012
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01071\n",
4013
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01017\n",
4014
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00838\n",
4015
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00843\n",
4016
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00714\n",
4017
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00606\n",
4018
            " -- Time: 6.25 seconds\n",
4019
            " -- Linear: model.layers.12.self_attn.k_proj\n",
4020
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.08574\n",
4021
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.07553\n",
4022
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.06922\n",
4023
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06050\n",
4024
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.03941\n",
4025
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03421\n",
4026
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05104\n",
4027
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.04590\n",
4028
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04042\n",
4029
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03277\n",
4030
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03136\n",
4031
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02597\n",
4032
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02200\n",
4033
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.01905\n",
4034
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01829\n",
4035
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01302\n",
4036
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01004\n",
4037
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00951\n",
4038
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00876\n",
4039
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00826\n",
4040
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00686\n",
4041
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00683\n",
4042
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00579\n",
4043
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00469\n",
4044
            " -- Time: 3.85 seconds\n",
4045
            " -- Linear: model.layers.12.self_attn.v_proj\n",
4046
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.19504\n",
4047
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.17522\n",
4048
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.16722\n",
4049
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14655\n",
4050
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09135\n",
4051
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08336\n",
4052
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10798\n",
4053
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09762\n",
4054
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09299\n",
4055
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07656\n",
4056
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07215\n",
4057
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05508\n",
4058
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04669\n",
4059
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04381\n",
4060
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04310\n",
4061
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02753\n",
4062
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02244\n",
4063
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02178\n",
4064
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01939\n",
4065
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01891\n",
4066
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01422\n",
4067
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01369\n",
4068
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01304\n",
4069
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00864\n",
4070
            " -- Time: 3.84 seconds\n",
4071
            " -- Linear: model.layers.12.self_attn.o_proj\n",
4072
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.21198\n",
4073
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18789\n",
4074
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17851\n",
4075
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15663\n",
4076
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09908\n",
4077
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08925\n",
4078
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11771\n",
4079
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10642\n",
4080
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10141\n",
4081
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08235\n",
4082
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07812\n",
4083
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06074\n",
4084
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05148\n",
4085
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04812\n",
4086
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04730\n",
4087
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03056\n",
4088
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02559\n",
4089
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02480\n",
4090
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02233\n",
4091
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02180\n",
4092
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01657\n",
4093
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01693\n",
4094
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01547\n",
4095
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01239\n",
4096
            " -- Time: 6.23 seconds\n",
4097
            " -- Layer: model.layers.12 (MLP)\n",
4098
            " -- Linear: model.layers.12.mlp.gate_proj\n",
4099
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.17317\n",
4100
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16089\n",
4101
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15653\n",
4102
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14139\n",
4103
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08192\n",
4104
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07739\n",
4105
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09302\n",
4106
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08500\n",
4107
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08295\n",
4108
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07225\n",
4109
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06919\n",
4110
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04771\n",
4111
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04103\n",
4112
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03965\n",
4113
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03932\n",
4114
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02403\n",
4115
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02109\n",
4116
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02078\n",
4117
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01922\n",
4118
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01902\n",
4119
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01327\n",
4120
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01375\n",
4121
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01282\n",
4122
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01025\n",
4123
            " -- Time: 16.80 seconds\n",
4124
            " -- Linear: model.layers.12.mlp.up_proj\n",
4125
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23561\n",
4126
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21922\n",
4127
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21368\n",
4128
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19274\n",
4129
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11136\n",
4130
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10544\n",
4131
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12512\n",
4132
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11497\n",
4133
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11266\n",
4134
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09816\n",
4135
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09356\n",
4136
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06397\n",
4137
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05511\n",
4138
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05348\n",
4139
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05310\n",
4140
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03199\n",
4141
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02766\n",
4142
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02727\n",
4143
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02501\n",
4144
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02476\n",
4145
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01693\n",
4146
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01695\n",
4147
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01637\n",
4148
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01149\n",
4149
            " -- Time: 16.72 seconds\n",
4150
            " -- Linear: model.layers.12.mlp.down_proj\n",
4151
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.23220\n",
4152
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20919\n",
4153
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19921\n",
4154
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17615\n",
4155
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10738\n",
4156
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09804\n",
4157
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12854\n",
4158
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11635\n",
4159
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.11008\n",
4160
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09202\n",
4161
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08705\n",
4162
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06542\n",
4163
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05593\n",
4164
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05194\n",
4165
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.05095\n",
4166
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03304\n",
4167
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02763\n",
4168
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02712\n",
4169
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02468\n",
4170
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02405\n",
4171
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01806\n",
4172
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01837\n",
4173
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01671\n",
4174
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01338\n",
4175
            " -- Time: 26.78 seconds\n",
4176
            " -- Layer: model.layers.13 (Attention)\n",
4177
            " -- Linear: model.layers.13.self_attn.q_proj\n",
4178
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.10346\n",
4179
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09299\n",
4180
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08766\n",
4181
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07699\n",
4182
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04820\n",
4183
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04354\n",
4184
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05839\n",
4185
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05322\n",
4186
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04910\n",
4187
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04058\n",
4188
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03850\n",
4189
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02967\n",
4190
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02545\n",
4191
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02319\n",
4192
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02264\n",
4193
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01485\n",
4194
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01207\n",
4195
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01163\n",
4196
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01055\n",
4197
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01019\n",
4198
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00778\n",
4199
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00777\n",
4200
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00696\n",
4201
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00522\n",
4202
            " -- Time: 6.21 seconds\n",
4203
            " -- Linear: model.layers.13.self_attn.k_proj\n",
4204
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.08538\n",
4205
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.07664\n",
4206
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07156\n",
4207
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06280\n",
4208
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.03961\n",
4209
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03533\n",
4210
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.04917\n",
4211
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.04484\n",
4212
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04036\n",
4213
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03339\n",
4214
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03179\n",
4215
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02494\n",
4216
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02147\n",
4217
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.01905\n",
4218
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01847\n",
4219
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01246\n",
4220
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.00989\n",
4221
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00945\n",
4222
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00865\n",
4223
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00825\n",
4224
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00651\n",
4225
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00643\n",
4226
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00569\n",
4227
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00422\n",
4228
            " -- Time: 3.82 seconds\n",
4229
            " -- Linear: model.layers.13.self_attn.v_proj\n",
4230
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.21169\n",
4231
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19023\n",
4232
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18235\n",
4233
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15968\n",
4234
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09888\n",
4235
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09079\n",
4236
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11536\n",
4237
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10443\n",
4238
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10062\n",
4239
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08274\n",
4240
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07782\n",
4241
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05883\n",
4242
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04983\n",
4243
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04732\n",
4244
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04671\n",
4245
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02938\n",
4246
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02406\n",
4247
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02345\n",
4248
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02073\n",
4249
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02031\n",
4250
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01508\n",
4251
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01435\n",
4252
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01392\n",
4253
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00878\n",
4254
            " -- Time: 3.81 seconds\n",
4255
            " -- Linear: model.layers.13.self_attn.o_proj\n",
4256
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22985\n",
4257
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20997\n",
4258
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20194\n",
4259
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18065\n",
4260
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10763\n",
4261
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09973\n",
4262
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12558\n",
4263
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11441\n",
4264
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10930\n",
4265
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09282\n",
4266
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08926\n",
4267
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06461\n",
4268
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05522\n",
4269
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05212\n",
4270
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05139\n",
4271
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03240\n",
4272
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02762\n",
4273
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02700\n",
4274
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02472\n",
4275
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02425\n",
4276
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01745\n",
4277
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01809\n",
4278
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01647\n",
4279
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01319\n",
4280
            " -- Time: 6.19 seconds\n",
4281
            " -- Layer: model.layers.13 (MLP)\n",
4282
            " -- Linear: model.layers.13.mlp.gate_proj\n",
4283
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.17483\n",
4284
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16251\n",
4285
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15795\n",
4286
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14266\n",
4287
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08279\n",
4288
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07819\n",
4289
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09385\n",
4290
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08610\n",
4291
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08379\n",
4292
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07304\n",
4293
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06979\n",
4294
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04815\n",
4295
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04151\n",
4296
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03999\n",
4297
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03964\n",
4298
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02414\n",
4299
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02113\n",
4300
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02080\n",
4301
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01922\n",
4302
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01901\n",
4303
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01303\n",
4304
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01362\n",
4305
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01251\n",
4306
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00993\n",
4307
            " -- Time: 16.77 seconds\n",
4308
            " -- Linear: model.layers.13.mlp.up_proj\n",
4309
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23982\n",
4310
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22323\n",
4311
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21751\n",
4312
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19635\n",
4313
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11347\n",
4314
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10742\n",
4315
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12767\n",
4316
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11723\n",
4317
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11476\n",
4318
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10007\n",
4319
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09532\n",
4320
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06526\n",
4321
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05620\n",
4322
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05448\n",
4323
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05408\n",
4324
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03266\n",
4325
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02815\n",
4326
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02773\n",
4327
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02544\n",
4328
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02519\n",
4329
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01729\n",
4330
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01721\n",
4331
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01670\n",
4332
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01159\n",
4333
            " -- Time: 16.72 seconds\n",
4334
            " -- Linear: model.layers.13.mlp.down_proj\n",
4335
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.24641\n",
4336
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22109\n",
4337
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21158\n",
4338
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18667\n",
4339
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11395\n",
4340
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.10431\n",
4341
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13424\n",
4342
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12162\n",
4343
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.11690\n",
4344
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09716\n",
4345
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09181\n",
4346
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06867\n",
4347
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05844\n",
4348
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05492\n",
4349
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.05408\n",
4350
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03458\n",
4351
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02889\n",
4352
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02847\n",
4353
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02562\n",
4354
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02507\n",
4355
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01873\n",
4356
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01869\n",
4357
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01756\n",
4358
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01328\n",
4359
            " -- Time: 26.78 seconds\n",
4360
            " -- Layer: model.layers.14 (Attention)\n",
4361
            " -- Linear: model.layers.14.self_attn.q_proj\n",
4362
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.10582\n",
4363
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09534\n",
4364
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08908\n",
4365
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07862\n",
4366
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04931\n",
4367
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04419\n",
4368
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06149\n",
4369
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05579\n",
4370
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05026\n",
4371
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04186\n",
4372
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04004\n",
4373
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03130\n",
4374
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02671\n",
4375
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02382\n",
4376
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02309\n",
4377
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01568\n",
4378
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01253\n",
4379
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01200\n",
4380
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01107\n",
4381
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01060\n",
4382
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00827\n",
4383
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00834\n",
4384
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00722\n",
4385
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00576\n",
4386
            " -- Time: 6.21 seconds\n",
4387
            " -- Linear: model.layers.14.self_attn.k_proj\n",
4388
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.08561\n",
4389
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.07738\n",
4390
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07080\n",
4391
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06264\n",
4392
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.03965\n",
4393
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03475\n",
4394
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05197\n",
4395
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.04725\n",
4396
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04042\n",
4397
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03395\n",
4398
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03267\n",
4399
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02629\n",
4400
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02257\n",
4401
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.01913\n",
4402
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01824\n",
4403
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01316\n",
4404
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01000\n",
4405
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00941\n",
4406
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00888\n",
4407
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00832\n",
4408
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00689\n",
4409
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00678\n",
4410
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00572\n",
4411
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00448\n",
4412
            " -- Time: 3.83 seconds\n",
4413
            " -- Linear: model.layers.14.self_attn.v_proj\n",
4414
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22144\n",
4415
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19968\n",
4416
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19127\n",
4417
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16781\n",
4418
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10366\n",
4419
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09508\n",
4420
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12296\n",
4421
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11022\n",
4422
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10547\n",
4423
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08733\n",
4424
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08233\n",
4425
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06295\n",
4426
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05278\n",
4427
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04971\n",
4428
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04898\n",
4429
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03148\n",
4430
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02549\n",
4431
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02481\n",
4432
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02217\n",
4433
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02167\n",
4434
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01627\n",
4435
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01558\n",
4436
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01481\n",
4437
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00998\n",
4438
            " -- Time: 3.84 seconds\n",
4439
            " -- Linear: model.layers.14.self_attn.o_proj\n",
4440
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.24642\n",
4441
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21851\n",
4442
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20690\n",
4443
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18059\n",
4444
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11514\n",
4445
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10416\n",
4446
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13897\n",
4447
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12539\n",
4448
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11840\n",
4449
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09537\n",
4450
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09121\n",
4451
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.07166\n",
4452
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.06063\n",
4453
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05589\n",
4454
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05472\n",
4455
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03587\n",
4456
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02969\n",
4457
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02881\n",
4458
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02585\n",
4459
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02511\n",
4460
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01920\n",
4461
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01975\n",
4462
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01767\n",
4463
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01432\n",
4464
            " -- Time: 6.21 seconds\n",
4465
            " -- Layer: model.layers.14 (MLP)\n",
4466
            " -- Linear: model.layers.14.mlp.gate_proj\n",
4467
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.16493\n",
4468
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15358\n",
4469
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.14900\n",
4470
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13483\n",
4471
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07826\n",
4472
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07376\n",
4473
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08938\n",
4474
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08197\n",
4475
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07921\n",
4476
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06925\n",
4477
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06623\n",
4478
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04587\n",
4479
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03957\n",
4480
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03788\n",
4481
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03748\n",
4482
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02303\n",
4483
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02014\n",
4484
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01981\n",
4485
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01840\n",
4486
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01816\n",
4487
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01248\n",
4488
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01319\n",
4489
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01191\n",
4490
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00978\n",
4491
            " -- Time: 16.75 seconds\n",
4492
            " -- Linear: model.layers.14.mlp.up_proj\n",
4493
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23642\n",
4494
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22076\n",
4495
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21511\n",
4496
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19454\n",
4497
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11210\n",
4498
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10626\n",
4499
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12655\n",
4500
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11623\n",
4501
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11338\n",
4502
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09929\n",
4503
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09471\n",
4504
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06476\n",
4505
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05580\n",
4506
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05394\n",
4507
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05350\n",
4508
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03243\n",
4509
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02805\n",
4510
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02763\n",
4511
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02549\n",
4512
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02521\n",
4513
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01728\n",
4514
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01745\n",
4515
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01663\n",
4516
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01207\n",
4517
            " -- Time: 16.72 seconds\n",
4518
            " -- Linear: model.layers.14.mlp.down_proj\n",
4519
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.23204\n",
4520
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20811\n",
4521
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19811\n",
4522
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17565\n",
4523
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10718\n",
4524
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09761\n",
4525
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12842\n",
4526
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11596\n",
4527
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10998\n",
4528
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09171\n",
4529
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08705\n",
4530
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06573\n",
4531
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05587\n",
4532
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05206\n",
4533
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.05104\n",
4534
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03340\n",
4535
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02796\n",
4536
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02744\n",
4537
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02504\n",
4538
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02438\n",
4539
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01849\n",
4540
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01893\n",
4541
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01699\n",
4542
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01411\n",
4543
            " -- Time: 26.80 seconds\n",
4544
            " -- Layer: model.layers.15 (Attention)\n",
4545
            " -- Linear: model.layers.15.self_attn.q_proj\n",
4546
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11824\n",
4547
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10740\n",
4548
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.10090\n",
4549
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08950\n",
4550
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05527\n",
4551
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04995\n",
4552
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06887\n",
4553
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06209\n",
4554
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05624\n",
4555
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04743\n",
4556
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04546\n",
4557
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03518\n",
4558
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02984\n",
4559
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02678\n",
4560
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02602\n",
4561
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01771\n",
4562
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01425\n",
4563
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01369\n",
4564
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01273\n",
4565
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01224\n",
4566
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00947\n",
4567
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00962\n",
4568
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00832\n",
4569
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00688\n",
4570
            " -- Time: 6.22 seconds\n",
4571
            " -- Linear: model.layers.15.self_attn.k_proj\n",
4572
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.08997\n",
4573
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.08158\n",
4574
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07426\n",
4575
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06600\n",
4576
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04151\n",
4577
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03625\n",
4578
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05554\n",
4579
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05021\n",
4580
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04234\n",
4581
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03593\n",
4582
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03491\n",
4583
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02827\n",
4584
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02404\n",
4585
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02007\n",
4586
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01901\n",
4587
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01418\n",
4588
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01052\n",
4589
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00984\n",
4590
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00942\n",
4591
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00876\n",
4592
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00742\n",
4593
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00723\n",
4594
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00604\n",
4595
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00478\n",
4596
            " -- Time: 3.78 seconds\n",
4597
            " -- Linear: model.layers.15.self_attn.v_proj\n",
4598
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23763\n",
4599
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21808\n",
4600
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21011\n",
4601
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18801\n",
4602
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11228\n",
4603
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10438\n",
4604
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13130\n",
4605
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11890\n",
4606
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11398\n",
4607
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09722\n",
4608
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09255\n",
4609
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06716\n",
4610
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05694\n",
4611
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05385\n",
4612
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05308\n",
4613
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03358\n",
4614
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02751\n",
4615
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02687\n",
4616
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02442\n",
4617
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02393\n",
4618
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01729\n",
4619
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01660\n",
4620
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01602\n",
4621
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01042\n",
4622
            " -- Time: 3.83 seconds\n",
4623
            " -- Linear: model.layers.15.self_attn.o_proj\n",
4624
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22281\n",
4625
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20108\n",
4626
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19287\n",
4627
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16640\n",
4628
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10428\n",
4629
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09603\n",
4630
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12125\n",
4631
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10998\n",
4632
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10599\n",
4633
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08663\n",
4634
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08045\n",
4635
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06233\n",
4636
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05283\n",
4637
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05024\n",
4638
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04962\n",
4639
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03121\n",
4640
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02622\n",
4641
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02562\n",
4642
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02269\n",
4643
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02227\n",
4644
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01662\n",
4645
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01658\n",
4646
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01577\n",
4647
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01154\n",
4648
            " -- Time: 6.20 seconds\n",
4649
            " -- Layer: model.layers.15 (MLP)\n",
4650
            " -- Linear: model.layers.15.mlp.gate_proj\n",
4651
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.16069\n",
4652
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15021\n",
4653
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.14602\n",
4654
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13239\n",
4655
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07632\n",
4656
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07225\n",
4657
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08692\n",
4658
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.07965\n",
4659
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07721\n",
4660
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06788\n",
4661
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06506\n",
4662
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04466\n",
4663
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03849\n",
4664
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03699\n",
4665
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03663\n",
4666
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02248\n",
4667
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01974\n",
4668
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01943\n",
4669
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01811\n",
4670
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01790\n",
4671
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01236\n",
4672
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01298\n",
4673
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01187\n",
4674
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00972\n",
4675
            " -- Time: 16.77 seconds\n",
4676
            " -- Linear: model.layers.15.mlp.up_proj\n",
4677
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23888\n",
4678
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22394\n",
4679
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21869\n",
4680
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19820\n",
4681
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11323\n",
4682
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10775\n",
4683
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12727\n",
4684
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11700\n",
4685
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11440\n",
4686
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10084\n",
4687
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09639\n",
4688
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06496\n",
4689
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05602\n",
4690
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05432\n",
4691
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05392\n",
4692
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03248\n",
4693
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02794\n",
4694
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02754\n",
4695
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02541\n",
4696
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02515\n",
4697
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01710\n",
4698
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01689\n",
4699
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01651\n",
4700
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01114\n",
4701
            " -- Time: 16.71 seconds\n",
4702
            " -- Linear: model.layers.15.mlp.down_proj\n",
4703
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.22929\n",
4704
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20544\n",
4705
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19581\n",
4706
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17408\n",
4707
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10567\n",
4708
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09612\n",
4709
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12543\n",
4710
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11389\n",
4711
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10852\n",
4712
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09041\n",
4713
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08577\n",
4714
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06395\n",
4715
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05471\n",
4716
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05095\n",
4717
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.05003\n",
4718
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03227\n",
4719
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02688\n",
4720
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02643\n",
4721
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02392\n",
4722
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02334\n",
4723
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01763\n",
4724
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01757\n",
4725
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01639\n",
4726
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01254\n",
4727
            " -- Time: 26.78 seconds\n",
4728
            " -- Layer: model.layers.16 (Attention)\n",
4729
            " -- Linear: model.layers.16.self_attn.q_proj\n",
4730
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11746\n",
4731
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10737\n",
4732
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.10179\n",
4733
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.09062\n",
4734
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05488\n",
4735
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.05019\n",
4736
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06660\n",
4737
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06065\n",
4738
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05572\n",
4739
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04742\n",
4740
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04533\n",
4741
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03389\n",
4742
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02900\n",
4743
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02641\n",
4744
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02577\n",
4745
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01698\n",
4746
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01376\n",
4747
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01328\n",
4748
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01228\n",
4749
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01187\n",
4750
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00893\n",
4751
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00889\n",
4752
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00799\n",
4753
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00601\n",
4754
            " -- Time: 6.24 seconds\n",
4755
            " -- Linear: model.layers.16.self_attn.k_proj\n",
4756
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09286\n",
4757
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.08501\n",
4758
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07839\n",
4759
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07006\n",
4760
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04299\n",
4761
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03820\n",
4762
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05563\n",
4763
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05094\n",
4764
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04370\n",
4765
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03752\n",
4766
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03612\n",
4767
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02812\n",
4768
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02428\n",
4769
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02069\n",
4770
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01978\n",
4771
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01404\n",
4772
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01075\n",
4773
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01012\n",
4774
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00966\n",
4775
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00904\n",
4776
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00733\n",
4777
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00717\n",
4778
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00613\n",
4779
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00456\n",
4780
            " -- Time: 3.89 seconds\n",
4781
            " -- Linear: model.layers.16.self_attn.v_proj\n",
4782
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.24342\n",
4783
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22526\n",
4784
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21816\n",
4785
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19590\n",
4786
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11499\n",
4787
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10791\n",
4788
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13360\n",
4789
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12081\n",
4790
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11661\n",
4791
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10061\n",
4792
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09606\n",
4793
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06830\n",
4794
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05777\n",
4795
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05512\n",
4796
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05448\n",
4797
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03414\n",
4798
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02804\n",
4799
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02746\n",
4800
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02504\n",
4801
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02462\n",
4802
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01754\n",
4803
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01666\n",
4804
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01634\n",
4805
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01022\n",
4806
            " -- Time: 3.85 seconds\n",
4807
            " -- Linear: model.layers.16.self_attn.o_proj\n",
4808
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23516\n",
4809
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21166\n",
4810
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20336\n",
4811
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18091\n",
4812
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10959\n",
4813
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10060\n",
4814
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12675\n",
4815
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11556\n",
4816
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11176\n",
4817
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09287\n",
4818
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08821\n",
4819
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06515\n",
4820
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05577\n",
4821
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05310\n",
4822
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05242\n",
4823
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03287\n",
4824
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02825\n",
4825
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02758\n",
4826
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02502\n",
4827
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02460\n",
4828
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01800\n",
4829
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01859\n",
4830
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01714\n",
4831
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01375\n",
4832
            " -- Time: 6.22 seconds\n",
4833
            " -- Layer: model.layers.16 (MLP)\n",
4834
            " -- Linear: model.layers.16.mlp.gate_proj\n",
4835
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.15193\n",
4836
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.14219\n",
4837
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.13810\n",
4838
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.12526\n",
4839
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07207\n",
4840
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.06821\n",
4841
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08244\n",
4842
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.07556\n",
4843
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07291\n",
4844
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06421\n",
4845
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06152\n",
4846
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04227\n",
4847
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03647\n",
4848
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03490\n",
4849
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03452\n",
4850
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02124\n",
4851
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01855\n",
4852
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01824\n",
4853
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01703\n",
4854
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01680\n",
4855
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01156\n",
4856
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01215\n",
4857
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01102\n",
4858
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00899\n",
4859
            " -- Time: 16.85 seconds\n",
4860
            " -- Linear: model.layers.16.mlp.up_proj\n",
4861
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23238\n",
4862
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21834\n",
4863
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21318\n",
4864
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19339\n",
4865
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11013\n",
4866
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10490\n",
4867
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12404\n",
4868
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11403\n",
4869
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11123\n",
4870
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09835\n",
4871
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09399\n",
4872
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06329\n",
4873
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05459\n",
4874
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05284\n",
4875
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05242\n",
4876
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03164\n",
4877
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02718\n",
4878
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02679\n",
4879
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02477\n",
4880
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02451\n",
4881
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01664\n",
4882
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01645\n",
4883
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01604\n",
4884
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01085\n",
4885
            " -- Time: 16.73 seconds\n",
4886
            " -- Linear: model.layers.16.mlp.down_proj\n",
4887
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.22319\n",
4888
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19859\n",
4889
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18842\n",
4890
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16736\n",
4891
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10245\n",
4892
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09253\n",
4893
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12249\n",
4894
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11134\n",
4895
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10546\n",
4896
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08704\n",
4897
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08280\n",
4898
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06257\n",
4899
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05346\n",
4900
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04942\n",
4901
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04840\n",
4902
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03161\n",
4903
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02606\n",
4904
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02557\n",
4905
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02307\n",
4906
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02243\n",
4907
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01725\n",
4908
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01710\n",
4909
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01591\n",
4910
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01215\n",
4911
            " -- Time: 26.79 seconds\n",
4912
            " -- Layer: model.layers.17 (Attention)\n",
4913
            " -- Linear: model.layers.17.self_attn.q_proj\n",
4914
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09829\n",
4915
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09000\n",
4916
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08431\n",
4917
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07568\n",
4918
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04579\n",
4919
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04136\n",
4920
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05741\n",
4921
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05237\n",
4922
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04662\n",
4923
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04001\n",
4924
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03857\n",
4925
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02920\n",
4926
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02505\n",
4927
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02210\n",
4928
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02135\n",
4929
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01463\n",
4930
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01162\n",
4931
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01111\n",
4932
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01049\n",
4933
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01001\n",
4934
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00768\n",
4935
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00777\n",
4936
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00663\n",
4937
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00532\n",
4938
            " -- Time: 6.19 seconds\n",
4939
            " -- Linear: model.layers.17.self_attn.k_proj\n",
4940
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.08335\n",
4941
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.07599\n",
4942
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.06954\n",
4943
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06252\n",
4944
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.03844\n",
4945
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03384\n",
4946
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05100\n",
4947
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.04629\n",
4948
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.03928\n",
4949
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03366\n",
4950
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03269\n",
4951
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02575\n",
4952
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02205\n",
4953
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.01855\n",
4954
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01764\n",
4955
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01288\n",
4956
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.00970\n",
4957
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00911\n",
4958
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00875\n",
4959
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00817\n",
4960
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00672\n",
4961
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00661\n",
4962
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00549\n",
4963
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00433\n",
4964
            " -- Time: 3.90 seconds\n",
4965
            " -- Linear: model.layers.17.self_attn.v_proj\n",
4966
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.20309\n",
4967
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18364\n",
4968
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17341\n",
4969
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15613\n",
4970
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09403\n",
4971
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08522\n",
4972
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11704\n",
4973
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10452\n",
4974
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09631\n",
4975
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08153\n",
4976
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07840\n",
4977
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05969\n",
4978
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04993\n",
4979
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04516\n",
4980
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04397\n",
4981
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02979\n",
4982
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02319\n",
4983
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02230\n",
4984
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02063\n",
4985
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01985\n",
4986
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01531\n",
4987
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01458\n",
4988
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01324\n",
4989
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00917\n",
4990
            " -- Time: 3.81 seconds\n",
4991
            " -- Linear: model.layers.17.self_attn.o_proj\n",
4992
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22796\n",
4993
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20518\n",
4994
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19632\n",
4995
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17325\n",
4996
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10651\n",
4997
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09758\n",
4998
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12522\n",
4999
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11352\n",
5000
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10867\n",
5001
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09042\n",
5002
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08499\n",
5003
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06454\n",
5004
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05483\n",
5005
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05163\n",
5006
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05087\n",
5007
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03239\n",
5008
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02747\n",
5009
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02676\n",
5010
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02437\n",
5011
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02388\n",
5012
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01756\n",
5013
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01816\n",
5014
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01653\n",
5015
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01336\n",
5016
            " -- Time: 6.20 seconds\n",
5017
            " -- Layer: model.layers.17 (MLP)\n",
5018
            " -- Linear: model.layers.17.mlp.gate_proj\n",
5019
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.15907\n",
5020
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.14871\n",
5021
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.14446\n",
5022
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13126\n",
5023
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07530\n",
5024
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07126\n",
5025
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08597\n",
5026
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.07891\n",
5027
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07619\n",
5028
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06721\n",
5029
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06452\n",
5030
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04402\n",
5031
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03805\n",
5032
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03643\n",
5033
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03605\n",
5034
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02213\n",
5035
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01933\n",
5036
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01901\n",
5037
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01776\n",
5038
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01752\n",
5039
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01206\n",
5040
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01261\n",
5041
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01151\n",
5042
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00929\n",
5043
            " -- Time: 16.79 seconds\n",
5044
            " -- Linear: model.layers.17.mlp.up_proj\n",
5045
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.24069\n",
5046
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22613\n",
5047
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.22082\n",
5048
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.20047\n",
5049
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11399\n",
5050
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10863\n",
5051
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12831\n",
5052
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11795\n",
5053
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11515\n",
5054
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10196\n",
5055
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09775\n",
5056
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06561\n",
5057
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05659\n",
5058
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05480\n",
5059
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05438\n",
5060
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03293\n",
5061
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02847\n",
5062
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02808\n",
5063
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02606\n",
5064
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02580\n",
5065
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01763\n",
5066
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01763\n",
5067
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01703\n",
5068
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01214\n",
5069
            " -- Time: 16.71 seconds\n",
5070
            " -- Linear: model.layers.17.mlp.down_proj\n",
5071
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.23679\n",
5072
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20960\n",
5073
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19847\n",
5074
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17539\n",
5075
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10882\n",
5076
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09788\n",
5077
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13094\n",
5078
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11836\n",
5079
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.11219\n",
5080
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09183\n",
5081
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08713\n",
5082
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06688\n",
5083
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05691\n",
5084
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05259\n",
5085
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.05153\n",
5086
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03377\n",
5087
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02791\n",
5088
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02738\n",
5089
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02464\n",
5090
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02395\n",
5091
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01851\n",
5092
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01852\n",
5093
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01705\n",
5094
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01337\n",
5095
            " -- Time: 26.73 seconds\n",
5096
            " -- Layer: model.layers.18 (Attention)\n",
5097
            " -- Linear: model.layers.18.self_attn.q_proj\n",
5098
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11366\n",
5099
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10467\n",
5100
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09871\n",
5101
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08852\n",
5102
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05320\n",
5103
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04850\n",
5104
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06644\n",
5105
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06008\n",
5106
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05405\n",
5107
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04669\n",
5108
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04498\n",
5109
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03393\n",
5110
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02889\n",
5111
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02578\n",
5112
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02500\n",
5113
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01706\n",
5114
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01370\n",
5115
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01318\n",
5116
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01243\n",
5117
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01196\n",
5118
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00911\n",
5119
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00927\n",
5120
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00797\n",
5121
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00663\n",
5122
            " -- Time: 6.22 seconds\n",
5123
            " -- Linear: model.layers.18.self_attn.k_proj\n",
5124
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09304\n",
5125
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.08449\n",
5126
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07639\n",
5127
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06885\n",
5128
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04281\n",
5129
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03714\n",
5130
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05762\n",
5131
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05275\n",
5132
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04376\n",
5133
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03751\n",
5134
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03660\n",
5135
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02914\n",
5136
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02510\n",
5137
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02066\n",
5138
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01948\n",
5139
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01457\n",
5140
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01083\n",
5141
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01007\n",
5142
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00979\n",
5143
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00904\n",
5144
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00763\n",
5145
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00751\n",
5146
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00612\n",
5147
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00488\n",
5148
            " -- Time: 3.87 seconds\n",
5149
            " -- Linear: model.layers.18.self_attn.v_proj\n",
5150
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22252\n",
5151
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20193\n",
5152
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19171\n",
5153
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17346\n",
5154
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10408\n",
5155
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09482\n",
5156
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12835\n",
5157
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11432\n",
5158
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10636\n",
5159
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09040\n",
5160
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08736\n",
5161
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06581\n",
5162
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05469\n",
5163
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04999\n",
5164
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04883\n",
5165
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03301\n",
5166
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02564\n",
5167
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02473\n",
5168
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02284\n",
5169
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02208\n",
5170
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01701\n",
5171
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01596\n",
5172
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01485\n",
5173
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01001\n",
5174
            " -- Time: 3.83 seconds\n",
5175
            " -- Linear: model.layers.18.self_attn.o_proj\n",
5176
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.19772\n",
5177
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.17592\n",
5178
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.16816\n",
5179
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14555\n",
5180
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09180\n",
5181
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08353\n",
5182
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10693\n",
5183
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09711\n",
5184
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09339\n",
5185
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07592\n",
5186
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07098\n",
5187
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05513\n",
5188
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04712\n",
5189
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04478\n",
5190
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04419\n",
5191
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02785\n",
5192
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02420\n",
5193
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02365\n",
5194
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02121\n",
5195
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02086\n",
5196
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01553\n",
5197
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01642\n",
5198
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01477\n",
5199
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01263\n",
5200
            " -- Time: 6.20 seconds\n",
5201
            " -- Layer: model.layers.18 (MLP)\n",
5202
            " -- Linear: model.layers.18.mlp.gate_proj\n",
5203
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.14728\n",
5204
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.13762\n",
5205
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.13347\n",
5206
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.12128\n",
5207
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.06964\n",
5208
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.06577\n",
5209
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07982\n",
5210
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.07330\n",
5211
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07050\n",
5212
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06210\n",
5213
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.05950\n",
5214
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04083\n",
5215
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03526\n",
5216
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03363\n",
5217
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03324\n",
5218
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02047\n",
5219
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01771\n",
5220
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01739\n",
5221
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01623\n",
5222
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01599\n",
5223
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01103\n",
5224
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01140\n",
5225
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01048\n",
5226
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00820\n",
5227
            " -- Time: 16.83 seconds\n",
5228
            " -- Linear: model.layers.18.mlp.up_proj\n",
5229
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22881\n",
5230
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21485\n",
5231
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20956\n",
5232
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19036\n",
5233
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10830\n",
5234
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10303\n",
5235
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12241\n",
5236
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11246\n",
5237
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10942\n",
5238
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09681\n",
5239
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09261\n",
5240
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06251\n",
5241
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05390\n",
5242
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05203\n",
5243
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05159\n",
5244
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03132\n",
5245
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02690\n",
5246
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02650\n",
5247
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02458\n",
5248
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02430\n",
5249
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01667\n",
5250
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01650\n",
5251
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01603\n",
5252
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01111\n",
5253
            " -- Time: 16.73 seconds\n",
5254
            " -- Linear: model.layers.18.mlp.down_proj\n",
5255
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.22510\n",
5256
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19820\n",
5257
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18676\n",
5258
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16481\n",
5259
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10319\n",
5260
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09216\n",
5261
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12568\n",
5262
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11338\n",
5263
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10659\n",
5264
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08683\n",
5265
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08259\n",
5266
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06434\n",
5267
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05471\n",
5268
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05003\n",
5269
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04886\n",
5270
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03262\n",
5271
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02680\n",
5272
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02623\n",
5273
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02369\n",
5274
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02295\n",
5275
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01807\n",
5276
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01818\n",
5277
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01649\n",
5278
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01341\n",
5279
            " -- Time: 26.79 seconds\n",
5280
            " -- Layer: model.layers.19 (Attention)\n",
5281
            " -- Linear: model.layers.19.self_attn.q_proj\n",
5282
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11644\n",
5283
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10768\n",
5284
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.10152\n",
5285
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.09162\n",
5286
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05452\n",
5287
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04974\n",
5288
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06825\n",
5289
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06184\n",
5290
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05541\n",
5291
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04821\n",
5292
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04669\n",
5293
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03480\n",
5294
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02965\n",
5295
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02633\n",
5296
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02550\n",
5297
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01744\n",
5298
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01385\n",
5299
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01330\n",
5300
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01260\n",
5301
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01210\n",
5302
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00928\n",
5303
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00923\n",
5304
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00810\n",
5305
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00638\n",
5306
            " -- Time: 6.23 seconds\n",
5307
            " -- Linear: model.layers.19.self_attn.k_proj\n",
5308
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09202\n",
5309
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.08449\n",
5310
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07618\n",
5311
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06889\n",
5312
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04248\n",
5313
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03691\n",
5314
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05797\n",
5315
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05307\n",
5316
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04333\n",
5317
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03766\n",
5318
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03691\n",
5319
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02941\n",
5320
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02524\n",
5321
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02054\n",
5322
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01927\n",
5323
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01472\n",
5324
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01077\n",
5325
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00997\n",
5326
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00982\n",
5327
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00903\n",
5328
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00773\n",
5329
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00752\n",
5330
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00611\n",
5331
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00488\n",
5332
            " -- Time: 3.83 seconds\n",
5333
            " -- Linear: model.layers.19.self_attn.v_proj\n",
5334
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23251\n",
5335
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21308\n",
5336
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20404\n",
5337
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18453\n",
5338
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10898\n",
5339
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10053\n",
5340
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13124\n",
5341
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11786\n",
5342
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11101\n",
5343
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09542\n",
5344
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09173\n",
5345
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06728\n",
5346
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05643\n",
5347
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05229\n",
5348
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05128\n",
5349
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03361\n",
5350
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02663\n",
5351
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02584\n",
5352
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02383\n",
5353
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02317\n",
5354
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01721\n",
5355
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01620\n",
5356
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01532\n",
5357
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00993\n",
5358
            " -- Time: 3.84 seconds\n",
5359
            " -- Linear: model.layers.19.self_attn.o_proj\n",
5360
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.21240\n",
5361
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19376\n",
5362
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18742\n",
5363
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16420\n",
5364
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09921\n",
5365
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09250\n",
5366
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11509\n",
5367
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10345\n",
5368
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10047\n",
5369
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08449\n",
5370
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07993\n",
5371
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05928\n",
5372
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05036\n",
5373
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04845\n",
5374
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04797\n",
5375
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03000\n",
5376
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02635\n",
5377
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02590\n",
5378
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02359\n",
5379
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02329\n",
5380
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01684\n",
5381
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01795\n",
5382
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01624\n",
5383
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01403\n",
5384
            " -- Time: 6.19 seconds\n",
5385
            " -- Layer: model.layers.19 (MLP)\n",
5386
            " -- Linear: model.layers.19.mlp.gate_proj\n",
5387
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.14325\n",
5388
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.13404\n",
5389
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.13019\n",
5390
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.11838\n",
5391
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.06772\n",
5392
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.06406\n",
5393
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07722\n",
5394
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.07102\n",
5395
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.06852\n",
5396
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06046\n",
5397
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.05793\n",
5398
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03943\n",
5399
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03415\n",
5400
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03266\n",
5401
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03230\n",
5402
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01978\n",
5403
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01714\n",
5404
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01685\n",
5405
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01571\n",
5406
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01549\n",
5407
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01061\n",
5408
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01094\n",
5409
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01011\n",
5410
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00779\n",
5411
            " -- Time: 16.78 seconds\n",
5412
            " -- Linear: model.layers.19.mlp.up_proj\n",
5413
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22417\n",
5414
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21056\n",
5415
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20544\n",
5416
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18681\n",
5417
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10609\n",
5418
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10102\n",
5419
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11969\n",
5420
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11008\n",
5421
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10719\n",
5422
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09500\n",
5423
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09090\n",
5424
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06112\n",
5425
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05278\n",
5426
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05099\n",
5427
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05057\n",
5428
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03066\n",
5429
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02648\n",
5430
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02611\n",
5431
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02426\n",
5432
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02399\n",
5433
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01647\n",
5434
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01641\n",
5435
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01587\n",
5436
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01129\n",
5437
            " -- Time: 16.74 seconds\n",
5438
            " -- Linear: model.layers.19.mlp.down_proj\n",
5439
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.21211\n",
5440
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18632\n",
5441
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17439\n",
5442
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15341\n",
5443
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09733\n",
5444
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.08616\n",
5445
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12003\n",
5446
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10839\n",
5447
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10058\n",
5448
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08150\n",
5449
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07764\n",
5450
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06150\n",
5451
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05253\n",
5452
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04730\n",
5453
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04602\n",
5454
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03137\n",
5455
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02558\n",
5456
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02490\n",
5457
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02262\n",
5458
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02176\n",
5459
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01772\n",
5460
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01772\n",
5461
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01604\n",
5462
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01321\n",
5463
            " -- Time: 26.78 seconds\n",
5464
            " -- Layer: model.layers.20 (Attention)\n",
5465
            " -- Linear: model.layers.20.self_attn.q_proj\n",
5466
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11630\n",
5467
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10727\n",
5468
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09987\n",
5469
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.09052\n",
5470
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05425\n",
5471
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04880\n",
5472
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07019\n",
5473
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06342\n",
5474
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05525\n",
5475
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04814\n",
5476
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04683\n",
5477
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03576\n",
5478
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03035\n",
5479
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02627\n",
5480
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02523\n",
5481
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01794\n",
5482
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01393\n",
5483
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01325\n",
5484
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01273\n",
5485
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01209\n",
5486
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00956\n",
5487
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00953\n",
5488
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00808\n",
5489
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00664\n",
5490
            " -- Time: 6.23 seconds\n",
5491
            " -- Linear: model.layers.20.self_attn.k_proj\n",
5492
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09284\n",
5493
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.08449\n",
5494
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07454\n",
5495
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06771\n",
5496
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04260\n",
5497
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03601\n",
5498
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06061\n",
5499
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05522\n",
5500
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04370\n",
5501
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03771\n",
5502
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03725\n",
5503
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03066\n",
5504
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02624\n",
5505
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02060\n",
5506
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01910\n",
5507
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01531\n",
5508
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01089\n",
5509
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.00993\n",
5510
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00995\n",
5511
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00897\n",
5512
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00802\n",
5513
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00785\n",
5514
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00608\n",
5515
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00510\n",
5516
            " -- Time: 3.83 seconds\n",
5517
            " -- Linear: model.layers.20.self_attn.v_proj\n",
5518
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23120\n",
5519
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20926\n",
5520
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19857\n",
5521
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17941\n",
5522
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10756\n",
5523
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09769\n",
5524
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13221\n",
5525
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11821\n",
5526
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10996\n",
5527
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09330\n",
5528
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09015\n",
5529
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06796\n",
5530
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05649\n",
5531
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05160\n",
5532
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05039\n",
5533
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03402\n",
5534
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02643\n",
5535
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02547\n",
5536
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02351\n",
5537
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02271\n",
5538
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01746\n",
5539
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01641\n",
5540
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01515\n",
5541
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01021\n",
5542
            " -- Time: 3.83 seconds\n",
5543
            " -- Linear: model.layers.20.self_attn.o_proj\n",
5544
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23250\n",
5545
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20446\n",
5546
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19377\n",
5547
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16236\n",
5548
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10847\n",
5549
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09762\n",
5550
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12756\n",
5551
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11605\n",
5552
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11059\n",
5553
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08639\n",
5554
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08040\n",
5555
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06563\n",
5556
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05604\n",
5557
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05256\n",
5558
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05170\n",
5559
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03302\n",
5560
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02801\n",
5561
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02722\n",
5562
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02378\n",
5563
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02324\n",
5564
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01788\n",
5565
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01861\n",
5566
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01677\n",
5567
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01376\n",
5568
            " -- Time: 6.22 seconds\n",
5569
            " -- Layer: model.layers.20 (MLP)\n",
5570
            " -- Linear: model.layers.20.mlp.gate_proj\n",
5571
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.15034\n",
5572
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.14114\n",
5573
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.13758\n",
5574
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.12504\n",
5575
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07114\n",
5576
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.06767\n",
5577
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08029\n",
5578
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.07404\n",
5579
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07192\n",
5580
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06368\n",
5581
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06092\n",
5582
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04098\n",
5583
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03555\n",
5584
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03425\n",
5585
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03395\n",
5586
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02052\n",
5587
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01788\n",
5588
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01761\n",
5589
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01639\n",
5590
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01620\n",
5591
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01092\n",
5592
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01124\n",
5593
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01049\n",
5594
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00788\n",
5595
            " -- Time: 16.78 seconds\n",
5596
            " -- Linear: model.layers.20.mlp.up_proj\n",
5597
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23300\n",
5598
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21932\n",
5599
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21445\n",
5600
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19492\n",
5601
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11020\n",
5602
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10522\n",
5603
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12351\n",
5604
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11371\n",
5605
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11129\n",
5606
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09876\n",
5607
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09448\n",
5608
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06288\n",
5609
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05443\n",
5610
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05285\n",
5611
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05248\n",
5612
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03154\n",
5613
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02717\n",
5614
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02682\n",
5615
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02484\n",
5616
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02461\n",
5617
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01673\n",
5618
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01640\n",
5619
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01619\n",
5620
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01081\n",
5621
            " -- Time: 16.73 seconds\n",
5622
            " -- Linear: model.layers.20.mlp.down_proj\n",
5623
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.21185\n",
5624
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18673\n",
5625
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17575\n",
5626
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15506\n",
5627
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09714\n",
5628
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.08663\n",
5629
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11739\n",
5630
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10685\n",
5631
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10019\n",
5632
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08144\n",
5633
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07747\n",
5634
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06004\n",
5635
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05138\n",
5636
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04694\n",
5637
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04584\n",
5638
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03042\n",
5639
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02490\n",
5640
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02435\n",
5641
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02188\n",
5642
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02117\n",
5643
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01677\n",
5644
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01660\n",
5645
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01531\n",
5646
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01191\n",
5647
            " -- Time: 26.79 seconds\n",
5648
            " -- Layer: model.layers.21 (Attention)\n",
5649
            " -- Linear: model.layers.21.self_attn.q_proj\n",
5650
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11127\n",
5651
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10196\n",
5652
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09483\n",
5653
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08600\n",
5654
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05187\n",
5655
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04645\n",
5656
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06690\n",
5657
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06061\n",
5658
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05291\n",
5659
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04576\n",
5660
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04454\n",
5661
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03412\n",
5662
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02899\n",
5663
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02507\n",
5664
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02407\n",
5665
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01714\n",
5666
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01319\n",
5667
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01253\n",
5668
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01199\n",
5669
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01136\n",
5670
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00913\n",
5671
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00893\n",
5672
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00773\n",
5673
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00607\n",
5674
            " -- Time: 6.20 seconds\n",
5675
            " -- Linear: model.layers.21.self_attn.k_proj\n",
5676
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09378\n",
5677
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.08510\n",
5678
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07577\n",
5679
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.06884\n",
5680
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04326\n",
5681
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03671\n",
5682
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06057\n",
5683
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05497\n",
5684
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04434\n",
5685
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03813\n",
5686
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03759\n",
5687
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03076\n",
5688
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02632\n",
5689
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02092\n",
5690
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.01945\n",
5691
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01535\n",
5692
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01100\n",
5693
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01008\n",
5694
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.00999\n",
5695
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00908\n",
5696
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00801\n",
5697
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00781\n",
5698
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00614\n",
5699
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00506\n",
5700
            " -- Time: 3.85 seconds\n",
5701
            " -- Linear: model.layers.21.self_attn.v_proj\n",
5702
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22163\n",
5703
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19857\n",
5704
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18638\n",
5705
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16824\n",
5706
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10239\n",
5707
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09164\n",
5708
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12891\n",
5709
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11509\n",
5710
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10520\n",
5711
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08830\n",
5712
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08537\n",
5713
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06626\n",
5714
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05503\n",
5715
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04911\n",
5716
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04761\n",
5717
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03326\n",
5718
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02517\n",
5719
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02403\n",
5720
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02228\n",
5721
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02129\n",
5722
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01708\n",
5723
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01587\n",
5724
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01435\n",
5725
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00975\n",
5726
            " -- Time: 3.84 seconds\n",
5727
            " -- Linear: model.layers.21.self_attn.o_proj\n",
5728
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23350\n",
5729
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20365\n",
5730
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19298\n",
5731
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16334\n",
5732
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10854\n",
5733
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09643\n",
5734
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12523\n",
5735
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11522\n",
5736
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11068\n",
5737
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08594\n",
5738
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07940\n",
5739
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06430\n",
5740
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05538\n",
5741
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05234\n",
5742
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05160\n",
5743
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03227\n",
5744
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02745\n",
5745
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02665\n",
5746
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02300\n",
5747
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02251\n",
5748
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01727\n",
5749
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01758\n",
5750
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01624\n",
5751
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01239\n",
5752
            " -- Time: 6.21 seconds\n",
5753
            " -- Layer: model.layers.21 (MLP)\n",
5754
            " -- Linear: model.layers.21.mlp.gate_proj\n",
5755
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.14922\n",
5756
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.14035\n",
5757
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.13702\n",
5758
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.12456\n",
5759
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07072\n",
5760
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.06739\n",
5761
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07943\n",
5762
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.07325\n",
5763
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07139\n",
5764
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06332\n",
5765
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06061\n",
5766
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04061\n",
5767
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03517\n",
5768
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03403\n",
5769
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03376\n",
5770
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02035\n",
5771
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01774\n",
5772
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01750\n",
5773
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01628\n",
5774
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01611\n",
5775
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01090\n",
5776
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01111\n",
5777
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01053\n",
5778
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00778\n",
5779
            " -- Time: 16.78 seconds\n",
5780
            " -- Linear: model.layers.21.mlp.up_proj\n",
5781
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23998\n",
5782
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22618\n",
5783
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.22144\n",
5784
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.20132\n",
5785
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11365\n",
5786
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10871\n",
5787
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12682\n",
5788
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11691\n",
5789
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11471\n",
5790
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10196\n",
5791
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09745\n",
5792
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06472\n",
5793
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05598\n",
5794
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05453\n",
5795
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05419\n",
5796
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03238\n",
5797
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02806\n",
5798
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02771\n",
5799
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02568\n",
5800
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02546\n",
5801
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01715\n",
5802
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01695\n",
5803
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01667\n",
5804
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01124\n",
5805
            " -- Time: 16.72 seconds\n",
5806
            " -- Linear: model.layers.21.mlp.down_proj\n",
5807
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.21060\n",
5808
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18573\n",
5809
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17462\n",
5810
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15507\n",
5811
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09622\n",
5812
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.08574\n",
5813
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11685\n",
5814
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10651\n",
5815
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.09940\n",
5816
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08131\n",
5817
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07743\n",
5818
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05938\n",
5819
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05114\n",
5820
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04648\n",
5821
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04530\n",
5822
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03010\n",
5823
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02458\n",
5824
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02399\n",
5825
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02170\n",
5826
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02094\n",
5827
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01659\n",
5828
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01635\n",
5829
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01509\n",
5830
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01158\n",
5831
            " -- Time: 26.82 seconds\n",
5832
            " -- Layer: model.layers.22 (Attention)\n",
5833
            " -- Linear: model.layers.22.self_attn.q_proj\n",
5834
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11209\n",
5835
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10229\n",
5836
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09493\n",
5837
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08603\n",
5838
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05214\n",
5839
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04653\n",
5840
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06759\n",
5841
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06109\n",
5842
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05337\n",
5843
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04590\n",
5844
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04473\n",
5845
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03453\n",
5846
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02925\n",
5847
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02521\n",
5848
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02418\n",
5849
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01736\n",
5850
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01327\n",
5851
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01260\n",
5852
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01205\n",
5853
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01141\n",
5854
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00927\n",
5855
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00901\n",
5856
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00782\n",
5857
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00614\n",
5858
            " -- Time: 6.22 seconds\n",
5859
            " -- Linear: model.layers.22.self_attn.k_proj\n",
5860
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.10182\n",
5861
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09235\n",
5862
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08218\n",
5863
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07468\n",
5864
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04701\n",
5865
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03994\n",
5866
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06553\n",
5867
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05968\n",
5868
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04823\n",
5869
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04141\n",
5870
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04076\n",
5871
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03335\n",
5872
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02857\n",
5873
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02278\n",
5874
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02124\n",
5875
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01667\n",
5876
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01206\n",
5877
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01106\n",
5878
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01095\n",
5879
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00998\n",
5880
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00877\n",
5881
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00861\n",
5882
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00679\n",
5883
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00569\n",
5884
            " -- Time: 3.81 seconds\n",
5885
            " -- Linear: model.layers.22.self_attn.v_proj\n",
5886
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.21928\n",
5887
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19550\n",
5888
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18235\n",
5889
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16446\n",
5890
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10102\n",
5891
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08950\n",
5892
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12897\n",
5893
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11501\n",
5894
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10395\n",
5895
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08672\n",
5896
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08398\n",
5897
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06603\n",
5898
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05492\n",
5899
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04849\n",
5900
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04685\n",
5901
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03305\n",
5902
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02487\n",
5903
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02364\n",
5904
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02197\n",
5905
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02087\n",
5906
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01693\n",
5907
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01587\n",
5908
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01411\n",
5909
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00978\n",
5910
            " -- Time: 3.84 seconds\n",
5911
            " -- Linear: model.layers.22.self_attn.o_proj\n",
5912
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.21762\n",
5913
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18789\n",
5914
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17726\n",
5915
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15261\n",
5916
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10171\n",
5917
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09076\n",
5918
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11871\n",
5919
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10860\n",
5920
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10392\n",
5921
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08076\n",
5922
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07427\n",
5923
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06082\n",
5924
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05235\n",
5925
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04925\n",
5926
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04849\n",
5927
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03053\n",
5928
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02610\n",
5929
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02537\n",
5930
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02207\n",
5931
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02155\n",
5932
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01645\n",
5933
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01714\n",
5934
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01544\n",
5935
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01247\n",
5936
            " -- Time: 6.22 seconds\n",
5937
            " -- Layer: model.layers.22 (MLP)\n",
5938
            " -- Linear: model.layers.22.mlp.gate_proj\n",
5939
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.16317\n",
5940
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15349\n",
5941
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.14991\n",
5942
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13635\n",
5943
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07727\n",
5944
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07367\n",
5945
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08670\n",
5946
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.07996\n",
5947
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07803\n",
5948
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06923\n",
5949
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06627\n",
5950
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04433\n",
5951
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03836\n",
5952
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03715\n",
5953
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03686\n",
5954
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02217\n",
5955
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01930\n",
5956
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01903\n",
5957
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01769\n",
5958
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01751\n",
5959
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01182\n",
5960
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01197\n",
5961
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01143\n",
5962
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00826\n",
5963
            " -- Time: 16.77 seconds\n",
5964
            " -- Linear: model.layers.22.mlp.up_proj\n",
5965
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.24401\n",
5966
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22991\n",
5967
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.22512\n",
5968
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.20468\n",
5969
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11556\n",
5970
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.11050\n",
5971
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12880\n",
5972
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11884\n",
5973
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11660\n",
5974
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10366\n",
5975
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09914\n",
5976
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06572\n",
5977
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05685\n",
5978
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05539\n",
5979
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05504\n",
5980
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03285\n",
5981
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02843\n",
5982
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02807\n",
5983
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02600\n",
5984
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02578\n",
5985
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01734\n",
5986
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01707\n",
5987
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01686\n",
5988
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01120\n",
5989
            " -- Time: 16.74 seconds\n",
5990
            " -- Linear: model.layers.22.mlp.down_proj\n",
5991
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.21802\n",
5992
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19351\n",
5993
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18269\n",
5994
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16234\n",
5995
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10003\n",
5996
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.08978\n",
5997
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12078\n",
5998
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10997\n",
5999
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10301\n",
6000
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08488\n",
6001
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08076\n",
6002
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06133\n",
6003
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05274\n",
6004
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04827\n",
6005
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04717\n",
6006
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03104\n",
6007
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02547\n",
6008
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02492\n",
6009
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02254\n",
6010
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02183\n",
6011
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01701\n",
6012
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01682\n",
6013
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01556\n",
6014
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01191\n",
6015
            " -- Time: 26.81 seconds\n",
6016
            " -- Layer: model.layers.23 (Attention)\n",
6017
            " -- Linear: model.layers.23.self_attn.q_proj\n",
6018
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11380\n",
6019
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10433\n",
6020
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09742\n",
6021
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08835\n",
6022
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05306\n",
6023
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04771\n",
6024
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06784\n",
6025
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06138\n",
6026
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05416\n",
6027
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04680\n",
6028
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04541\n",
6029
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03455\n",
6030
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02936\n",
6031
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02560\n",
6032
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02463\n",
6033
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01730\n",
6034
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01337\n",
6035
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01272\n",
6036
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01213\n",
6037
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01151\n",
6038
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00914\n",
6039
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00890\n",
6040
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00778\n",
6041
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00591\n",
6042
            " -- Time: 6.21 seconds\n",
6043
            " -- Linear: model.layers.23.self_attn.k_proj\n",
6044
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.10156\n",
6045
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09196\n",
6046
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08329\n",
6047
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07560\n",
6048
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04688\n",
6049
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04059\n",
6050
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06309\n",
6051
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05749\n",
6052
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04804\n",
6053
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04111\n",
6054
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04020\n",
6055
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03200\n",
6056
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02746\n",
6057
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02265\n",
6058
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02140\n",
6059
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01605\n",
6060
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01187\n",
6061
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01105\n",
6062
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01073\n",
6063
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00993\n",
6064
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00838\n",
6065
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00821\n",
6066
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00671\n",
6067
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00536\n",
6068
            " -- Time: 3.80 seconds\n",
6069
            " -- Linear: model.layers.23.self_attn.v_proj\n",
6070
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23422\n",
6071
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21260\n",
6072
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20214\n",
6073
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18244\n",
6074
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10900\n",
6075
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09931\n",
6076
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13251\n",
6077
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11975\n",
6078
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11144\n",
6079
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09471\n",
6080
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09120\n",
6081
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06770\n",
6082
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05719\n",
6083
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05224\n",
6084
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05103\n",
6085
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03382\n",
6086
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02671\n",
6087
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02575\n",
6088
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02379\n",
6089
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02298\n",
6090
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01734\n",
6091
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01653\n",
6092
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01523\n",
6093
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01019\n",
6094
            " -- Time: 3.88 seconds\n",
6095
            " -- Linear: model.layers.23.self_attn.o_proj\n",
6096
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.21480\n",
6097
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18771\n",
6098
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17768\n",
6099
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14708\n",
6100
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09886\n",
6101
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08851\n",
6102
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11611\n",
6103
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10647\n",
6104
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10162\n",
6105
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07861\n",
6106
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07177\n",
6107
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05943\n",
6108
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05118\n",
6109
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04773\n",
6110
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04689\n",
6111
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02974\n",
6112
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02508\n",
6113
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02427\n",
6114
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02111\n",
6115
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02054\n",
6116
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01586\n",
6117
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01625\n",
6118
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01473\n",
6119
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01144\n",
6120
            " -- Time: 6.19 seconds\n",
6121
            " -- Layer: model.layers.23 (MLP)\n",
6122
            " -- Linear: model.layers.23.mlp.gate_proj\n",
6123
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.17054\n",
6124
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16037\n",
6125
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15662\n",
6126
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14237\n",
6127
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08076\n",
6128
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07698\n",
6129
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09058\n",
6130
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08349\n",
6131
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08155\n",
6132
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07227\n",
6133
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06921\n",
6134
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04622\n",
6135
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04005\n",
6136
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03883\n",
6137
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03853\n",
6138
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02320\n",
6139
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02017\n",
6140
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01990\n",
6141
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01847\n",
6142
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01829\n",
6143
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01246\n",
6144
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01250\n",
6145
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01206\n",
6146
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00863\n",
6147
            " -- Time: 16.78 seconds\n",
6148
            " -- Linear: model.layers.23.mlp.up_proj\n",
6149
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.24915\n",
6150
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.23466\n",
6151
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.22974\n",
6152
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.20875\n",
6153
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11804\n",
6154
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.11278\n",
6155
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13139\n",
6156
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12130\n",
6157
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11907\n",
6158
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10571\n",
6159
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.10097\n",
6160
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06703\n",
6161
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05804\n",
6162
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05656\n",
6163
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05621\n",
6164
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03350\n",
6165
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02898\n",
6166
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02862\n",
6167
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02646\n",
6168
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02623\n",
6169
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01764\n",
6170
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01732\n",
6171
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01715\n",
6172
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01125\n",
6173
            " -- Time: 16.71 seconds\n",
6174
            " -- Linear: model.layers.23.mlp.down_proj\n",
6175
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.22415\n",
6176
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19883\n",
6177
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18751\n",
6178
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.16688\n",
6179
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10277\n",
6180
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09218\n",
6181
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12361\n",
6182
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11317\n",
6183
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10595\n",
6184
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08731\n",
6185
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08310\n",
6186
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06306\n",
6187
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05426\n",
6188
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04954\n",
6189
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04837\n",
6190
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03177\n",
6191
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02603\n",
6192
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02545\n",
6193
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02301\n",
6194
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02226\n",
6195
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01716\n",
6196
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01705\n",
6197
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01560\n",
6198
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01188\n",
6199
            " -- Time: 26.73 seconds\n",
6200
            " -- Layer: model.layers.24 (Attention)\n",
6201
            " -- Linear: model.layers.24.self_attn.q_proj\n",
6202
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.12260\n",
6203
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.11279\n",
6204
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.10554\n",
6205
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.09573\n",
6206
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05739\n",
6207
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.05178\n",
6208
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07278\n",
6209
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06617\n",
6210
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05844\n",
6211
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.05073\n",
6212
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04924\n",
6213
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03712\n",
6214
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03172\n",
6215
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02773\n",
6216
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02670\n",
6217
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01860\n",
6218
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01456\n",
6219
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01389\n",
6220
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01324\n",
6221
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01261\n",
6222
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00981\n",
6223
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00976\n",
6224
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00839\n",
6225
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00663\n",
6226
            " -- Time: 6.21 seconds\n",
6227
            " -- Linear: model.layers.24.self_attn.k_proj\n",
6228
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.10946\n",
6229
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10019\n",
6230
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09057\n",
6231
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08224\n",
6232
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05079\n",
6233
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04400\n",
6234
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06904\n",
6235
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06303\n",
6236
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05189\n",
6237
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04493\n",
6238
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04405\n",
6239
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03504\n",
6240
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03008\n",
6241
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02456\n",
6242
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02307\n",
6243
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01753\n",
6244
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01283\n",
6245
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01189\n",
6246
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01166\n",
6247
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01073\n",
6248
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00918\n",
6249
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00890\n",
6250
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00729\n",
6251
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00571\n",
6252
            " -- Time: 3.80 seconds\n",
6253
            " -- Linear: model.layers.24.self_attn.v_proj\n",
6254
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.24243\n",
6255
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22225\n",
6256
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21292\n",
6257
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19248\n",
6258
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11347\n",
6259
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10475\n",
6260
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13544\n",
6261
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12257\n",
6262
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11565\n",
6263
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09936\n",
6264
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09544\n",
6265
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06901\n",
6266
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05849\n",
6267
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05435\n",
6268
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05331\n",
6269
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03449\n",
6270
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02771\n",
6271
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02689\n",
6272
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02482\n",
6273
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02415\n",
6274
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01768\n",
6275
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01686\n",
6276
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01590\n",
6277
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01036\n",
6278
            " -- Time: 3.81 seconds\n",
6279
            " -- Linear: model.layers.24.self_attn.o_proj\n",
6280
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.18462\n",
6281
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16712\n",
6282
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15897\n",
6283
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13305\n",
6284
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08657\n",
6285
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07936\n",
6286
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10264\n",
6287
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09414\n",
6288
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08770\n",
6289
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07102\n",
6290
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06521\n",
6291
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05243\n",
6292
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04509\n",
6293
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04164\n",
6294
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04079\n",
6295
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02619\n",
6296
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02157\n",
6297
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02092\n",
6298
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01845\n",
6299
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01788\n",
6300
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01375\n",
6301
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01365\n",
6302
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01258\n",
6303
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00905\n",
6304
            " -- Time: 6.20 seconds\n",
6305
            " -- Layer: model.layers.24 (MLP)\n",
6306
            " -- Linear: model.layers.24.mlp.gate_proj\n",
6307
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.17165\n",
6308
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16135\n",
6309
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15763\n",
6310
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14326\n",
6311
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08135\n",
6312
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07753\n",
6313
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09113\n",
6314
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08407\n",
6315
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08214\n",
6316
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07274\n",
6317
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06955\n",
6318
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04653\n",
6319
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04032\n",
6320
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03910\n",
6321
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03881\n",
6322
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02330\n",
6323
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02027\n",
6324
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02000\n",
6325
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01854\n",
6326
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01836\n",
6327
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01242\n",
6328
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01249\n",
6329
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01202\n",
6330
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00855\n",
6331
            " -- Time: 16.76 seconds\n",
6332
            " -- Linear: model.layers.24.mlp.up_proj\n",
6333
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.25261\n",
6334
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.23792\n",
6335
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.23302\n",
6336
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.21172\n",
6337
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11972\n",
6338
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.11447\n",
6339
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13373\n",
6340
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12299\n",
6341
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.12081\n",
6342
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10716\n",
6343
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.10251\n",
6344
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06826\n",
6345
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05892\n",
6346
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05744\n",
6347
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05708\n",
6348
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03423\n",
6349
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02952\n",
6350
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02916\n",
6351
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02696\n",
6352
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02674\n",
6353
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01830\n",
6354
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01776\n",
6355
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01782\n",
6356
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01172\n",
6357
            " -- Time: 16.70 seconds\n",
6358
            " -- Linear: model.layers.24.mlp.down_proj\n",
6359
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.22909\n",
6360
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20351\n",
6361
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19234\n",
6362
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17107\n",
6363
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10504\n",
6364
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09446\n",
6365
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12623\n",
6366
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11529\n",
6367
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10829\n",
6368
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08941\n",
6369
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08494\n",
6370
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06397\n",
6371
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05522\n",
6372
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05058\n",
6373
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04942\n",
6374
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03230\n",
6375
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02647\n",
6376
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02589\n",
6377
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02340\n",
6378
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02265\n",
6379
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01751\n",
6380
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01719\n",
6381
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01599\n",
6382
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01182\n",
6383
            " -- Time: 26.72 seconds\n",
6384
            " -- Layer: model.layers.25 (Attention)\n",
6385
            " -- Linear: model.layers.25.self_attn.q_proj\n",
6386
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.12900\n",
6387
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.11907\n",
6388
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.11197\n",
6389
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.10142\n",
6390
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.06049\n",
6391
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.05492\n",
6392
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07604\n",
6393
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06910\n",
6394
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.06151\n",
6395
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.05347\n",
6396
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.05184\n",
6397
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03876\n",
6398
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03306\n",
6399
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02918\n",
6400
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02820\n",
6401
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01940\n",
6402
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01522\n",
6403
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01456\n",
6404
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01382\n",
6405
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01321\n",
6406
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01017\n",
6407
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01003\n",
6408
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00875\n",
6409
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00668\n",
6410
            " -- Time: 6.20 seconds\n",
6411
            " -- Linear: model.layers.25.self_attn.k_proj\n",
6412
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11070\n",
6413
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10151\n",
6414
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09247\n",
6415
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08384\n",
6416
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05146\n",
6417
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04495\n",
6418
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06873\n",
6419
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06295\n",
6420
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05250\n",
6421
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04551\n",
6422
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04442\n",
6423
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03481\n",
6424
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03008\n",
6425
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02483\n",
6426
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02343\n",
6427
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01742\n",
6428
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01292\n",
6429
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01203\n",
6430
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01174\n",
6431
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01086\n",
6432
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00904\n",
6433
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00883\n",
6434
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00729\n",
6435
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00564\n",
6436
            " -- Time: 3.85 seconds\n",
6437
            " -- Linear: model.layers.25.self_attn.v_proj\n",
6438
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.24470\n",
6439
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22439\n",
6440
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21520\n",
6441
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19456\n",
6442
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11443\n",
6443
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10578\n",
6444
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13687\n",
6445
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12336\n",
6446
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11654\n",
6447
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10039\n",
6448
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09637\n",
6449
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06994\n",
6450
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05896\n",
6451
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05485\n",
6452
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05384\n",
6453
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03487\n",
6454
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02793\n",
6455
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02710\n",
6456
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02503\n",
6457
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02437\n",
6458
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01793\n",
6459
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01695\n",
6460
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01609\n",
6461
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01037\n",
6462
            " -- Time: 3.80 seconds\n",
6463
            " -- Linear: model.layers.25.self_attn.o_proj\n",
6464
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.19971\n",
6465
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.17495\n",
6466
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.16666\n",
6467
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13776\n",
6468
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09312\n",
6469
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08423\n",
6470
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10770\n",
6471
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09795\n",
6472
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09494\n",
6473
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07392\n",
6474
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06606\n",
6475
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05482\n",
6476
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04697\n",
6477
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04471\n",
6478
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04418\n",
6479
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02750\n",
6480
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02313\n",
6481
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02253\n",
6482
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01925\n",
6483
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01888\n",
6484
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01463\n",
6485
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01430\n",
6486
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01390\n",
6487
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00958\n",
6488
            " -- Time: 6.19 seconds\n",
6489
            " -- Layer: model.layers.25 (MLP)\n",
6490
            " -- Linear: model.layers.25.mlp.gate_proj\n",
6491
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.17795\n",
6492
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16722\n",
6493
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.16331\n",
6494
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14839\n",
6495
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08445\n",
6496
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08044\n",
6497
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09471\n",
6498
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08726\n",
6499
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08527\n",
6500
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07546\n",
6501
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07213\n",
6502
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04844\n",
6503
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04190\n",
6504
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04062\n",
6505
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04032\n",
6506
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02428\n",
6507
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02113\n",
6508
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02084\n",
6509
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01933\n",
6510
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01914\n",
6511
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01304\n",
6512
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01312\n",
6513
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01263\n",
6514
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00910\n",
6515
            " -- Time: 16.76 seconds\n",
6516
            " -- Linear: model.layers.25.mlp.up_proj\n",
6517
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.25596\n",
6518
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.24084\n",
6519
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.23583\n",
6520
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.21412\n",
6521
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.12140\n",
6522
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.11602\n",
6523
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13501\n",
6524
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12474\n",
6525
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.12254\n",
6526
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10858\n",
6527
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.10364\n",
6528
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06887\n",
6529
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05970\n",
6530
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05820\n",
6531
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05784\n",
6532
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03440\n",
6533
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02980\n",
6534
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02943\n",
6535
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02717\n",
6536
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02694\n",
6537
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01798\n",
6538
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01778\n",
6539
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01748\n",
6540
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01151\n",
6541
            " -- Time: 16.68 seconds\n",
6542
            " -- Linear: model.layers.25.mlp.down_proj\n",
6543
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.23103\n",
6544
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20522\n",
6545
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19355\n",
6546
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17225\n",
6547
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10588\n",
6548
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09500\n",
6549
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12759\n",
6550
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11703\n",
6551
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10922\n",
6552
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09041\n",
6553
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08588\n",
6554
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06501\n",
6555
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05611\n",
6556
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05101\n",
6557
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04974\n",
6558
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03263\n",
6559
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02675\n",
6560
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02612\n",
6561
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02371\n",
6562
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02290\n",
6563
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01746\n",
6564
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01750\n",
6565
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01578\n",
6566
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01207\n",
6567
            " -- Time: 26.74 seconds\n",
6568
            " -- Layer: model.layers.26 (Attention)\n",
6569
            " -- Linear: model.layers.26.self_attn.q_proj\n",
6570
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.12400\n",
6571
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.11394\n",
6572
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.10634\n",
6573
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.09626\n",
6574
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05808\n",
6575
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.05220\n",
6576
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07396\n",
6577
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06728\n",
6578
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05918\n",
6579
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.05122\n",
6580
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04970\n",
6581
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03773\n",
6582
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03227\n",
6583
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02804\n",
6584
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02695\n",
6585
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01888\n",
6586
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01467\n",
6587
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01396\n",
6588
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01331\n",
6589
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01263\n",
6590
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00986\n",
6591
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00981\n",
6592
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00834\n",
6593
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00655\n",
6594
            " -- Time: 6.20 seconds\n",
6595
            " -- Linear: model.layers.26.self_attn.k_proj\n",
6596
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.10733\n",
6597
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09786\n",
6598
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08772\n",
6599
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07956\n",
6600
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04976\n",
6601
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04267\n",
6602
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06874\n",
6603
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06260\n",
6604
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05088\n",
6605
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04381\n",
6606
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04301\n",
6607
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03479\n",
6608
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02981\n",
6609
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02406\n",
6610
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02250\n",
6611
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01739\n",
6612
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01260\n",
6613
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01160\n",
6614
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01143\n",
6615
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01045\n",
6616
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00913\n",
6617
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00881\n",
6618
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00717\n",
6619
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00566\n",
6620
            " -- Time: 3.83 seconds\n",
6621
            " -- Linear: model.layers.26.self_attn.v_proj\n",
6622
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23561\n",
6623
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21320\n",
6624
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20178\n",
6625
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18208\n",
6626
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10948\n",
6627
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09923\n",
6628
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13531\n",
6629
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12136\n",
6630
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11215\n",
6631
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09498\n",
6632
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09165\n",
6633
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06941\n",
6634
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05795\n",
6635
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05253\n",
6636
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05117\n",
6637
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03472\n",
6638
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02681\n",
6639
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02576\n",
6640
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02380\n",
6641
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02292\n",
6642
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01782\n",
6643
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01662\n",
6644
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01538\n",
6645
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01014\n",
6646
            " -- Time: 3.78 seconds\n",
6647
            " -- Linear: model.layers.26.self_attn.o_proj\n",
6648
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.19595\n",
6649
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.17731\n",
6650
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17136\n",
6651
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14596\n",
6652
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09234\n",
6653
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08536\n",
6654
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10379\n",
6655
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09552\n",
6656
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09358\n",
6657
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07667\n",
6658
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06999\n",
6659
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05305\n",
6660
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04578\n",
6661
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04433\n",
6662
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04400\n",
6663
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02652\n",
6664
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02284\n",
6665
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02238\n",
6666
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01966\n",
6667
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01943\n",
6668
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01391\n",
6669
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01389\n",
6670
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01344\n",
6671
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00925\n",
6672
            " -- Time: 6.19 seconds\n",
6673
            " -- Layer: model.layers.26 (MLP)\n",
6674
            " -- Linear: model.layers.26.mlp.gate_proj\n",
6675
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.18272\n",
6676
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.17161\n",
6677
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.16761\n",
6678
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15209\n",
6679
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08677\n",
6680
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08269\n",
6681
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09719\n",
6682
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08969\n",
6683
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08762\n",
6684
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07741\n",
6685
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07390\n",
6686
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04969\n",
6687
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04302\n",
6688
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04170\n",
6689
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04140\n",
6690
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02485\n",
6691
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02162\n",
6692
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02132\n",
6693
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01974\n",
6694
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01954\n",
6695
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01320\n",
6696
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01332\n",
6697
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01277\n",
6698
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00911\n",
6699
            " -- Time: 16.80 seconds\n",
6700
            " -- Linear: model.layers.26.mlp.up_proj\n",
6701
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.25765\n",
6702
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.24243\n",
6703
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.23726\n",
6704
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.21532\n",
6705
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.12240\n",
6706
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.11689\n",
6707
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13638\n",
6708
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12577\n",
6709
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.12352\n",
6710
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10932\n",
6711
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.10434\n",
6712
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06969\n",
6713
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.06023\n",
6714
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05870\n",
6715
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05834\n",
6716
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03484\n",
6717
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.03016\n",
6718
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02978\n",
6719
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02749\n",
6720
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02726\n",
6721
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01842\n",
6722
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01812\n",
6723
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01790\n",
6724
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01192\n",
6725
            " -- Time: 16.72 seconds\n",
6726
            " -- Linear: model.layers.26.mlp.down_proj\n",
6727
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.23600\n",
6728
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21045\n",
6729
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19898\n",
6730
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17697\n",
6731
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10846\n",
6732
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09767\n",
6733
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13012\n",
6734
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11931\n",
6735
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.11173\n",
6736
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09277\n",
6737
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08794\n",
6738
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06635\n",
6739
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05727\n",
6740
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05228\n",
6741
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.05105\n",
6742
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03353\n",
6743
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02746\n",
6744
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02683\n",
6745
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02439\n",
6746
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02359\n",
6747
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01825\n",
6748
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01798\n",
6749
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01663\n",
6750
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01248\n",
6751
            " -- Time: 26.78 seconds\n",
6752
            " -- Layer: model.layers.27 (Attention)\n",
6753
            " -- Linear: model.layers.27.self_attn.q_proj\n",
6754
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.12800\n",
6755
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.11782\n",
6756
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.11131\n",
6757
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.10085\n",
6758
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.06014\n",
6759
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.05475\n",
6760
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07450\n",
6761
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06772\n",
6762
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.06119\n",
6763
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.05302\n",
6764
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.05126\n",
6765
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03807\n",
6766
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03246\n",
6767
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02901\n",
6768
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02815\n",
6769
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01906\n",
6770
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01516\n",
6771
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01454\n",
6772
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01374\n",
6773
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01318\n",
6774
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01001\n",
6775
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00993\n",
6776
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00873\n",
6777
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00666\n",
6778
            " -- Time: 6.21 seconds\n",
6779
            " -- Linear: model.layers.27.self_attn.k_proj\n",
6780
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11138\n",
6781
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10262\n",
6782
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09586\n",
6783
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08676\n",
6784
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05208\n",
6785
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04693\n",
6786
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06588\n",
6787
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06038\n",
6788
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05305\n",
6789
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04602\n",
6790
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04448\n",
6791
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03345\n",
6792
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02885\n",
6793
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02511\n",
6794
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02417\n",
6795
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01676\n",
6796
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01307\n",
6797
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01244\n",
6798
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01185\n",
6799
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01125\n",
6800
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00880\n",
6801
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00864\n",
6802
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00750\n",
6803
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00566\n",
6804
            " -- Time: 3.84 seconds\n",
6805
            " -- Linear: model.layers.27.self_attn.v_proj\n",
6806
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23298\n",
6807
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21409\n",
6808
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20526\n",
6809
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18563\n",
6810
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10952\n",
6811
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10109\n",
6812
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12914\n",
6813
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11787\n",
6814
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11131\n",
6815
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09585\n",
6816
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09179\n",
6817
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06580\n",
6818
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05635\n",
6819
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05246\n",
6820
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05151\n",
6821
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03284\n",
6822
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02669\n",
6823
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02589\n",
6824
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02386\n",
6825
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02323\n",
6826
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01685\n",
6827
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01613\n",
6828
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01537\n",
6829
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00977\n",
6830
            " -- Time: 3.82 seconds\n",
6831
            " -- Linear: model.layers.27.self_attn.o_proj\n",
6832
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.21200\n",
6833
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.18792\n",
6834
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17930\n",
6835
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15069\n",
6836
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09955\n",
6837
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09040\n",
6838
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11465\n",
6839
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10507\n",
6840
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10141\n",
6841
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07998\n",
6842
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07405\n",
6843
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05895\n",
6844
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05073\n",
6845
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04826\n",
6846
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04768\n",
6847
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02975\n",
6848
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02572\n",
6849
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02513\n",
6850
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02197\n",
6851
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02157\n",
6852
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01632\n",
6853
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01694\n",
6854
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01555\n",
6855
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01257\n",
6856
            " -- Time: 6.21 seconds\n",
6857
            " -- Layer: model.layers.27 (MLP)\n",
6858
            " -- Linear: model.layers.27.mlp.gate_proj\n",
6859
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.17764\n",
6860
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16664\n",
6861
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.16263\n",
6862
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.14745\n",
6863
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08444\n",
6864
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08030\n",
6865
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09481\n",
6866
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08744\n",
6867
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08529\n",
6868
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07525\n",
6869
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07172\n",
6870
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04845\n",
6871
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04203\n",
6872
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04066\n",
6873
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04033\n",
6874
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02426\n",
6875
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02116\n",
6876
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02086\n",
6877
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01932\n",
6878
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01911\n",
6879
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01290\n",
6880
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01317\n",
6881
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01245\n",
6882
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00915\n",
6883
            " -- Time: 16.77 seconds\n",
6884
            " -- Linear: model.layers.27.mlp.up_proj\n",
6885
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.25108\n",
6886
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.23599\n",
6887
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.23094\n",
6888
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.20941\n",
6889
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11934\n",
6890
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.11386\n",
6891
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13301\n",
6892
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12278\n",
6893
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.12049\n",
6894
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10647\n",
6895
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.10147\n",
6896
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06792\n",
6897
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05881\n",
6898
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05724\n",
6899
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05687\n",
6900
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03394\n",
6901
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02938\n",
6902
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02900\n",
6903
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02675\n",
6904
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02651\n",
6905
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01784\n",
6906
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01762\n",
6907
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01731\n",
6908
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01152\n",
6909
            " -- Time: 16.71 seconds\n",
6910
            " -- Linear: model.layers.27.mlp.down_proj\n",
6911
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.23620\n",
6912
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20981\n",
6913
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19752\n",
6914
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17574\n",
6915
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10841\n",
6916
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.09708\n",
6917
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13220\n",
6918
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12031\n",
6919
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.11186\n",
6920
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09251\n",
6921
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08790\n",
6922
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06722\n",
6923
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05766\n",
6924
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05227\n",
6925
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.05094\n",
6926
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03389\n",
6927
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02747\n",
6928
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02681\n",
6929
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02436\n",
6930
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02351\n",
6931
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01839\n",
6932
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01807\n",
6933
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01660\n",
6934
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01255\n",
6935
            " -- Time: 26.76 seconds\n",
6936
            " -- Layer: model.layers.28 (Attention)\n",
6937
            " -- Linear: model.layers.28.self_attn.q_proj\n",
6938
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11916\n",
6939
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10948\n",
6940
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.10109\n",
6941
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.09155\n",
6942
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05581\n",
6943
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04952\n",
6944
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07333\n",
6945
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06626\n",
6946
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05690\n",
6947
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04925\n",
6948
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04815\n",
6949
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03747\n",
6950
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03177\n",
6951
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02701\n",
6952
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02579\n",
6953
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01876\n",
6954
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01423\n",
6955
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01343\n",
6956
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01293\n",
6957
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01216\n",
6958
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00986\n",
6959
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00973\n",
6960
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00813\n",
6961
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00657\n",
6962
            " -- Time: 6.20 seconds\n",
6963
            " -- Linear: model.layers.28.self_attn.k_proj\n",
6964
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.10099\n",
6965
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09191\n",
6966
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08054\n",
6967
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07318\n",
6968
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04673\n",
6969
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03898\n",
6970
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06745\n",
6971
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06117\n",
6972
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04785\n",
6973
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04130\n",
6974
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04084\n",
6975
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03410\n",
6976
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02918\n",
6977
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02265\n",
6978
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02082\n",
6979
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01709\n",
6980
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01194\n",
6981
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01081\n",
6982
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01087\n",
6983
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00973\n",
6984
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00890\n",
6985
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00864\n",
6986
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00663\n",
6987
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00555\n",
6988
            " -- Time: 3.79 seconds\n",
6989
            " -- Linear: model.layers.28.self_attn.v_proj\n",
6990
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23685\n",
6991
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21366\n",
6992
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.20104\n",
6993
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.18104\n",
6994
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11007\n",
6995
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09898\n",
6996
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13777\n",
6997
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12351\n",
6998
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11284\n",
6999
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09523\n",
7000
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09198\n",
7001
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.07078\n",
7002
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05913\n",
7003
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05296\n",
7004
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05141\n",
7005
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03556\n",
7006
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02727\n",
7007
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02609\n",
7008
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02422\n",
7009
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02322\n",
7010
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01831\n",
7011
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01733\n",
7012
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01558\n",
7013
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01099\n",
7014
            " -- Time: 3.80 seconds\n",
7015
            " -- Linear: model.layers.28.self_attn.o_proj\n",
7016
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.22737\n",
7017
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19411\n",
7018
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18248\n",
7019
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15765\n",
7020
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10530\n",
7021
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09273\n",
7022
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12337\n",
7023
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11270\n",
7024
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10799\n",
7025
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08227\n",
7026
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07847\n",
7027
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06327\n",
7028
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05415\n",
7029
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05081\n",
7030
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04999\n",
7031
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03169\n",
7032
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02673\n",
7033
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02590\n",
7034
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02225\n",
7035
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02169\n",
7036
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01706\n",
7037
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01731\n",
7038
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01599\n",
7039
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01227\n",
7040
            " -- Time: 6.21 seconds\n",
7041
            " -- Layer: model.layers.28 (MLP)\n",
7042
            " -- Linear: model.layers.28.mlp.gate_proj\n",
7043
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.16706\n",
7044
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15650\n",
7045
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15241\n",
7046
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13809\n",
7047
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07939\n",
7048
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07527\n",
7049
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08959\n",
7050
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08263\n",
7051
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08023\n",
7052
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07062\n",
7053
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06740\n",
7054
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04581\n",
7055
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03969\n",
7056
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03821\n",
7057
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03787\n",
7058
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02293\n",
7059
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01987\n",
7060
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01956\n",
7061
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01811\n",
7062
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01789\n",
7063
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01220\n",
7064
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01237\n",
7065
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01171\n",
7066
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00853\n",
7067
            " -- Time: 16.76 seconds\n",
7068
            " -- Linear: model.layers.28.mlp.up_proj\n",
7069
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23511\n",
7070
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.22073\n",
7071
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.21568\n",
7072
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.19541\n",
7073
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11175\n",
7074
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.10642\n",
7075
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12497\n",
7076
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11535\n",
7077
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11284\n",
7078
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09957\n",
7079
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09490\n",
7080
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06392\n",
7081
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05531\n",
7082
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05369\n",
7083
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05329\n",
7084
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03199\n",
7085
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02771\n",
7086
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02733\n",
7087
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02525\n",
7088
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02500\n",
7089
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01694\n",
7090
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01690\n",
7091
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01639\n",
7092
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01135\n",
7093
            " -- Time: 16.70 seconds\n",
7094
            " -- Linear: model.layers.28.mlp.down_proj\n",
7095
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.21678\n",
7096
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19135\n",
7097
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.17924\n",
7098
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15888\n",
7099
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09953\n",
7100
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.08835\n",
7101
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12181\n",
7102
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.11122\n",
7103
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10275\n",
7104
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08420\n",
7105
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07999\n",
7106
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06226\n",
7107
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05358\n",
7108
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04823\n",
7109
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04689\n",
7110
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03155\n",
7111
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02574\n",
7112
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02505\n",
7113
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02281\n",
7114
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02195\n",
7115
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01736\n",
7116
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01746\n",
7117
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01561\n",
7118
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01263\n",
7119
            " -- Time: 26.80 seconds\n",
7120
            " -- Layer: model.layers.29 (Attention)\n",
7121
            " -- Linear: model.layers.29.self_attn.q_proj\n",
7122
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11633\n",
7123
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10687\n",
7124
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09922\n",
7125
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08996\n",
7126
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05443\n",
7127
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04862\n",
7128
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07176\n",
7129
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06381\n",
7130
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05549\n",
7131
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04804\n",
7132
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04688\n",
7133
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03664\n",
7134
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03057\n",
7135
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02629\n",
7136
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02519\n",
7137
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01837\n",
7138
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01378\n",
7139
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01303\n",
7140
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01251\n",
7141
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01182\n",
7142
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00962\n",
7143
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00929\n",
7144
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00793\n",
7145
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00619\n",
7146
            " -- Time: 6.20 seconds\n",
7147
            " -- Linear: model.layers.29.self_attn.k_proj\n",
7148
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.10096\n",
7149
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09321\n",
7150
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08475\n",
7151
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07676\n",
7152
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04705\n",
7153
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04115\n",
7154
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06402\n",
7155
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05806\n",
7156
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04792\n",
7157
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04176\n",
7158
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04090\n",
7159
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03252\n",
7160
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02767\n",
7161
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02274\n",
7162
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02141\n",
7163
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01626\n",
7164
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01190\n",
7165
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01105\n",
7166
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01087\n",
7167
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01002\n",
7168
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00850\n",
7169
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00824\n",
7170
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00673\n",
7171
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00531\n",
7172
            " -- Time: 3.82 seconds\n",
7173
            " -- Linear: model.layers.29.self_attn.v_proj\n",
7174
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.25490\n",
7175
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.23516\n",
7176
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.22557\n",
7177
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.20400\n",
7178
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.12012\n",
7179
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.11134\n",
7180
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.14274\n",
7181
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12954\n",
7182
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.12215\n",
7183
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.10564\n",
7184
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.10147\n",
7185
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.07304\n",
7186
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.06200\n",
7187
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05764\n",
7188
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05657\n",
7189
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03666\n",
7190
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02949\n",
7191
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02865\n",
7192
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02653\n",
7193
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02583\n",
7194
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01884\n",
7195
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01809\n",
7196
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01694\n",
7197
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01133\n",
7198
            " -- Time: 3.78 seconds\n",
7199
            " -- Linear: model.layers.29.self_attn.o_proj\n",
7200
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.19766\n",
7201
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16867\n",
7202
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15821\n",
7203
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13995\n",
7204
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09188\n",
7205
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.08069\n",
7206
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10952\n",
7207
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09814\n",
7208
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.09429\n",
7209
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07310\n",
7210
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07000\n",
7211
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05625\n",
7212
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04722\n",
7213
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04440\n",
7214
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04370\n",
7215
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02818\n",
7216
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02332\n",
7217
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02257\n",
7218
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01963\n",
7219
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01917\n",
7220
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01500\n",
7221
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01505\n",
7222
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01398\n",
7223
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01065\n",
7224
            " -- Time: 6.22 seconds\n",
7225
            " -- Layer: model.layers.29 (MLP)\n",
7226
            " -- Linear: model.layers.29.mlp.gate_proj\n",
7227
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.16208\n",
7228
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15172\n",
7229
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.14757\n",
7230
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13356\n",
7231
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07702\n",
7232
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07297\n",
7233
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08709\n",
7234
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08036\n",
7235
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07788\n",
7236
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06844\n",
7237
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06527\n",
7238
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04455\n",
7239
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03862\n",
7240
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03711\n",
7241
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03676\n",
7242
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02231\n",
7243
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01938\n",
7244
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01907\n",
7245
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01768\n",
7246
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01745\n",
7247
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01190\n",
7248
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01221\n",
7249
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01140\n",
7250
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00855\n",
7251
            " -- Time: 16.78 seconds\n",
7252
            " -- Linear: model.layers.29.mlp.up_proj\n",
7253
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.20992\n",
7254
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19685\n",
7255
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19202\n",
7256
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17416\n",
7257
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10051\n",
7258
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09569\n",
7259
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.11278\n",
7260
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10406\n",
7261
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10156\n",
7262
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08960\n",
7263
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08555\n",
7264
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05828\n",
7265
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05090\n",
7266
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04933\n",
7267
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04898\n",
7268
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02937\n",
7269
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02721\n",
7270
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02688\n",
7271
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02521\n",
7272
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02500\n",
7273
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01658\n",
7274
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01893\n",
7275
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01610\n",
7276
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01526\n",
7277
            " -- Time: 16.72 seconds\n",
7278
            " -- Linear: model.layers.29.mlp.down_proj\n",
7279
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.21573\n",
7280
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.19141\n",
7281
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.18033\n",
7282
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.15850\n",
7283
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.09927\n",
7284
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.08897\n",
7285
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.12029\n",
7286
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.10954\n",
7287
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.10214\n",
7288
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.08370\n",
7289
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.07890\n",
7290
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.06104\n",
7291
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05253\n",
7292
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04791\n",
7293
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04676\n",
7294
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03064\n",
7295
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02528\n",
7296
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02470\n",
7297
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02226\n",
7298
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02151\n",
7299
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01645\n",
7300
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01670\n",
7301
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01491\n",
7302
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01178\n",
7303
            " -- Time: 26.78 seconds\n",
7304
            " -- Layer: model.layers.30 (Attention)\n",
7305
            " -- Linear: model.layers.30.self_attn.q_proj\n",
7306
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11347\n",
7307
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.10390\n",
7308
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09477\n",
7309
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08558\n",
7310
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05303\n",
7311
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04638\n",
7312
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07177\n",
7313
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06453\n",
7314
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05413\n",
7315
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04664\n",
7316
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04581\n",
7317
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03667\n",
7318
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03100\n",
7319
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02572\n",
7320
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02433\n",
7321
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01841\n",
7322
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01363\n",
7323
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01274\n",
7324
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01238\n",
7325
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01151\n",
7326
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00972\n",
7327
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00955\n",
7328
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00781\n",
7329
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00648\n",
7330
            " -- Time: 6.23 seconds\n",
7331
            " -- Linear: model.layers.30.self_attn.k_proj\n",
7332
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09913\n",
7333
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09016\n",
7334
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07836\n",
7335
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07101\n",
7336
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04575\n",
7337
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03783\n",
7338
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06726\n",
7339
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06079\n",
7340
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04693\n",
7341
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04040\n",
7342
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04014\n",
7343
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03422\n",
7344
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02902\n",
7345
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02224\n",
7346
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02033\n",
7347
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01718\n",
7348
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01180\n",
7349
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01061\n",
7350
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01076\n",
7351
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00955\n",
7352
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00894\n",
7353
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00868\n",
7354
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00650\n",
7355
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00564\n",
7356
            " -- Time: 3.82 seconds\n",
7357
            " -- Linear: model.layers.30.self_attn.v_proj\n",
7358
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.23066\n",
7359
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.20681\n",
7360
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19312\n",
7361
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17402\n",
7362
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.10691\n",
7363
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09514\n",
7364
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.13683\n",
7365
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.12224\n",
7366
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.10968\n",
7367
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09215\n",
7368
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.08949\n",
7369
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.07042\n",
7370
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.05845\n",
7371
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05150\n",
7372
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.04971\n",
7373
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03542\n",
7374
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02662\n",
7375
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02530\n",
7376
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02364\n",
7377
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02248\n",
7378
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01832\n",
7379
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01728\n",
7380
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01517\n",
7381
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01106\n",
7382
            " -- Time: 3.81 seconds\n",
7383
            " -- Linear: model.layers.30.self_attn.o_proj\n",
7384
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.17670\n",
7385
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15877\n",
7386
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15307\n",
7387
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13045\n",
7388
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08273\n",
7389
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07668\n",
7390
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.09408\n",
7391
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08571\n",
7392
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08387\n",
7393
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06803\n",
7394
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06273\n",
7395
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04834\n",
7396
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04136\n",
7397
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03999\n",
7398
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03966\n",
7399
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02425\n",
7400
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02117\n",
7401
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02080\n",
7402
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01832\n",
7403
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01811\n",
7404
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01313\n",
7405
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01369\n",
7406
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01271\n",
7407
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01006\n",
7408
            " -- Time: 6.22 seconds\n",
7409
            " -- Layer: model.layers.30 (MLP)\n",
7410
            " -- Linear: model.layers.30.mlp.gate_proj\n",
7411
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.15936\n",
7412
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.14924\n",
7413
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.14528\n",
7414
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13162\n",
7415
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07624\n",
7416
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07227\n",
7417
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08603\n",
7418
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.07933\n",
7419
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07705\n",
7420
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06784\n",
7421
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06488\n",
7422
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04448\n",
7423
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03879\n",
7424
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03740\n",
7425
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03707\n",
7426
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02246\n",
7427
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02056\n",
7428
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02028\n",
7429
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01901\n",
7430
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01882\n",
7431
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01267\n",
7432
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01425\n",
7433
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01223\n",
7434
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01139\n",
7435
            " -- Time: 16.81 seconds\n",
7436
            " -- Linear: model.layers.30.mlp.up_proj\n",
7437
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.16603\n",
7438
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.15569\n",
7439
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15184\n",
7440
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13759\n",
7441
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07945\n",
7442
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.07553\n",
7443
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.08923\n",
7444
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.08227\n",
7445
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.08023\n",
7446
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07077\n",
7447
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06760\n",
7448
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04609\n",
7449
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04012\n",
7450
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03886\n",
7451
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03855\n",
7452
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02325\n",
7453
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02123\n",
7454
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02095\n",
7455
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01960\n",
7456
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01943\n",
7457
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01306\n",
7458
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01453\n",
7459
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01265\n",
7460
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01151\n",
7461
            " -- Time: 16.72 seconds\n",
7462
            " -- Linear: model.layers.30.mlp.down_proj\n",
7463
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.18738\n",
7464
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.16703\n",
7465
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.15843\n",
7466
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.13782\n",
7467
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.08682\n",
7468
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.07855\n",
7469
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.10584\n",
7470
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.09386\n",
7471
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.08880\n",
7472
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.07284\n",
7473
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.06854\n",
7474
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.05334\n",
7475
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.04573\n",
7476
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.04253\n",
7477
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.04171\n",
7478
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02725\n",
7479
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02341\n",
7480
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.02301\n",
7481
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02086\n",
7482
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02037\n",
7483
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01563\n",
7484
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01646\n",
7485
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01464\n",
7486
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01297\n",
7487
            " -- Time: 26.74 seconds\n",
7488
            " -- Layer: model.layers.31 (Attention)\n",
7489
            " -- Linear: model.layers.31.self_attn.q_proj\n",
7490
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.10866\n",
7491
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09916\n",
7492
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09031\n",
7493
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08169\n",
7494
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05073\n",
7495
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04421\n",
7496
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06838\n",
7497
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06180\n",
7498
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05183\n",
7499
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04453\n",
7500
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04367\n",
7501
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03496\n",
7502
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02965\n",
7503
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02457\n",
7504
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02324\n",
7505
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01751\n",
7506
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01299\n",
7507
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01213\n",
7508
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01178\n",
7509
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01095\n",
7510
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00921\n",
7511
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00908\n",
7512
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00739\n",
7513
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00612\n",
7514
            " -- Time: 6.20 seconds\n",
7515
            " -- Linear: model.layers.31.self_attn.k_proj\n",
7516
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09790\n",
7517
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.08884\n",
7518
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.07772\n",
7519
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.07047\n",
7520
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04527\n",
7521
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.03773\n",
7522
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06637\n",
7523
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05931\n",
7524
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04648\n",
7525
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.03986\n",
7526
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03951\n",
7527
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03362\n",
7528
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02834\n",
7529
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02199\n",
7530
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02022\n",
7531
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01685\n",
7532
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01166\n",
7533
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01057\n",
7534
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01061\n",
7535
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.00950\n",
7536
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00885\n",
7537
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00850\n",
7538
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00657\n",
7539
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00558\n",
7540
            " -- Time: 3.81 seconds\n",
7541
            " -- Linear: model.layers.31.self_attn.v_proj\n",
7542
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.24299\n",
7543
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.21556\n",
7544
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.19947\n",
7545
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.17985\n",
7546
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.11267\n",
7547
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.09866\n",
7548
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.14473\n",
7549
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.13010\n",
7550
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.11611\n",
7551
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.09605\n",
7552
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.09349\n",
7553
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.07436\n",
7554
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.06221\n",
7555
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.05421\n",
7556
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.05216\n",
7557
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.03738\n",
7558
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.02799\n",
7559
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.02645\n",
7560
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.02463\n",
7561
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.02326\n",
7562
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01925\n",
7563
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01820\n",
7564
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01589\n",
7565
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01143\n",
7566
            " -- Time: 3.81 seconds\n",
7567
            " -- Linear: model.layers.31.self_attn.o_proj\n",
7568
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.11279\n",
7569
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09924\n",
7570
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.09478\n",
7571
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08162\n",
7572
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05092\n",
7573
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04609\n",
7574
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.06104\n",
7575
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.05349\n",
7576
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.05188\n",
7577
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04118\n",
7578
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03942\n",
7579
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03045\n",
7580
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02751\n",
7581
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02643\n",
7582
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02621\n",
7583
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01618\n",
7584
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01648\n",
7585
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01625\n",
7586
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01499\n",
7587
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01487\n",
7588
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01008\n",
7589
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01328\n",
7590
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00977\n",
7591
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.01199\n",
7592
            " -- Time: 6.19 seconds\n",
7593
            " -- Layer: model.layers.31 (MLP)\n",
7594
            " -- Linear: model.layers.31.mlp.gate_proj\n",
7595
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.14756\n",
7596
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.13842\n",
7597
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.13503\n",
7598
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.12221\n",
7599
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.07013\n",
7600
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.06670\n",
7601
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07889\n",
7602
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.07267\n",
7603
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.07083\n",
7604
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.06240\n",
7605
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.05951\n",
7606
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.04030\n",
7607
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03487\n",
7608
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.03371\n",
7609
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.03344\n",
7610
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.02017\n",
7611
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01744\n",
7612
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01718\n",
7613
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01588\n",
7614
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01570\n",
7615
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01063\n",
7616
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01072\n",
7617
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.01024\n",
7618
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00726\n",
7619
            " -- Time: 16.81 seconds\n",
7620
            " -- Linear: model.layers.31.mlp.up_proj\n",
7621
            " -- 0.05:3b/0.95:2b 32g s4         2.19 bpw    rfn_error: 0.09824\n",
7622
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.09194\n",
7623
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.08962\n",
7624
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.08108\n",
7625
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.04664\n",
7626
            " -- 0.2:6b/0.8:3b 32g s4           3.69 bpw    rfn_error: 0.04430\n",
7627
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.05260\n",
7628
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.04838\n",
7629
            " -- 0.05:4b/0.95:3b 32g s4         3.19 bpw    rfn_error: 0.04713\n",
7630
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.04143\n",
7631
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.03955\n",
7632
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.02695\n",
7633
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.02329\n",
7634
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02251\n",
7635
            " -- 0.1:6b/0.9:4b 32g s4           4.31 bpw    rfn_error: 0.02232\n",
7636
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01354\n",
7637
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01183\n",
7638
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.38 bpw    rfn_error: 0.01166\n",
7639
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01080\n",
7640
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01069\n",
7641
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.00736\n",
7642
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.00754\n",
7643
            " -- 0.1:8b/0.9:6b 128g s4          6.22 bpw    rfn_error: 0.00711\n",
7644
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00542\n",
7645
            " -- Time: 16.70 seconds\n",
7646
            " -- Linear: model.layers.31.mlp.down_proj\n",
7647
            " -- 0.05:3b/0.95:2b 32g s4         2.18 bpw    rfn_error: 0.12848\n",
7648
            " -- 0.25:3b/0.75:2b 32g s4         2.38 bpw    rfn_error: 0.11652\n",
7649
            " -- 0.25:4b/0.75:2b 32g s4         2.63 bpw    rfn_error: 0.11088\n",
7650
            " -- 0.1:4b/0.4:3b/0.5:2b 32g s4    2.72 bpw    rfn_error: 0.09626\n",
7651
            " -- 0.1:4b/0.9:3b 32g s4           3.22 bpw    rfn_error: 0.05991\n",
7652
            " -- 0.2:6b/0.8:3b 32g s4           3.71 bpw    rfn_error: 0.05494\n",
7653
            " -- 1.0:3b 128g s4                 3.03 bpw    rfn_error: 0.07339\n",
7654
            " -- 1.0:3b 32g s4                  3.13 bpw    rfn_error: 0.06539\n",
7655
            " -- 0.05:4b/0.95:3b 32g s4         3.18 bpw    rfn_error: 0.06116\n",
7656
            " -- 0.4:4b/0.6:3b 32g s4           3.53 bpw    rfn_error: 0.05120\n",
7657
            " -- 0.6:4b/0.4:3b 64g s4           3.66 bpw    rfn_error: 0.04834\n",
7658
            " -- 1.0:4b 128g s4                 4.03 bpw    rfn_error: 0.03777\n",
7659
            " -- 1.0:4b 32g s4                  4.13 bpw    rfn_error: 0.03195\n",
7660
            " -- 0.1:5b/0.9:4b 32g s4           4.22 bpw    rfn_error: 0.02955\n",
7661
            " -- 0.1:6b/0.9:4b 32g s4           4.32 bpw    rfn_error: 0.02893\n",
7662
            " -- 1.0:5b 128g s4                 5.03 bpw    rfn_error: 0.01943\n",
7663
            " -- 0.1:6b/0.9:5b 32g s4           5.22 bpw    rfn_error: 0.01655\n",
7664
            " -- 0.05:8b/0.05:6b/0.9:5b 32g s4  5.34 bpw    rfn_error: 0.01626\n",
7665
            " -- 0.4:6b/0.6:5b 32g s4           5.53 bpw    rfn_error: 0.01499\n",
7666
            " -- 0.1:8b/0.3:6b/0.6:5b 32g s4    5.72 bpw    rfn_error: 0.01465\n",
7667
            " -- 1.0:6b 128g s4                 6.03 bpw    rfn_error: 0.01136\n",
7668
            " -- 1.0:6b 32g s4                  6.13 bpw    rfn_error: 0.01197\n",
7669
            " -- 0.1:8b/0.9:6b 128g s4          6.23 bpw    rfn_error: 0.01058\n",
7670
            " -- 1.0:8b 32g s4                  8.13 bpw    rfn_error: 0.00968\n",
7671
            " -- Time: 26.78 seconds\n",
7672
            " -- Layer: model.norm (RMSNorm)\n",
7673
            " -- Layer: lm_head (Linear)\n",
7674
            " -- Calibration perplexity (base): 6.5756\n",
7675
            " -- Optimizing...\n",
7676
            " -- rfn max: 0.12882  bpw: 2.89358\n",
7677
            " -- rfn max: 0.06441  bpw: 3.83733\n",
7678
            " -- rfn max: 0.03221  bpw: 4.87716\n",
7679
            " -- rfn max: 0.01610  bpw: 6.44259\n",
7680
            " -- rfn max: 0.02420  bpw: 5.31034\n",
7681
            " -- rfn max: 0.02831  bpw: 4.98366\n",
7682
            " -- rfn max: 0.02625  bpw: 5.11053\n",
7683
            " -- rfn max: 0.02733  bpw: 5.03992\n",
7684
            " -- rfn max: 0.02792  bpw: 5.00472\n",
7685
            " -- rfn max: 0.02826  bpw: 4.98372\n",
7686
            " -- rfn max: 0.02809  bpw: 4.99354\n",
7687
            " -- rfn max: 0.02800  bpw: 4.99961\n",
7688
            " -- rfn max: 0.02796  bpw: 5.00233\n",
7689
            " -- rfn max: 0.02803  bpw: 4.99924\n",
7690
            " -- rfn max: 0.02800  bpw: 4.99961\n",
7691
            " -- rfn max: 0.02798  bpw: 5.00233\n",
7692
            " -- rfn max: 0.02804  bpw: 4.99880\n",
7693
            " -- rfn max: 0.02801  bpw: 4.99961\n",
7694
            " -- rfn max: 0.02799  bpw: 5.00093\n",
7695
            " -- rfn max: 0.02805  bpw: 4.99880\n",
7696
            " -- rfn max: 0.02802  bpw: 4.99924\n",
7697
            " -- rfn max: 0.02801  bpw: 4.99961\n",
7698
            " -- rfn max: 0.02800  bpw: 4.99961\n",
7699
            " -- rfn min: 0.01400  bpw: 5.89112\n",
7700
            " -- rfn min: 0.02100  bpw: 5.27758\n",
7701
            " -- rfn min: 0.02450  bpw: 5.11620\n",
7702
            " -- rfn min: 0.02625  bpw: 5.03063\n",
7703
            " -- rfn min: 0.02713  bpw: 5.00971\n",
7704
            " -- rfn min: 0.02756  bpw: 4.99961\n",
7705
            " -- rfn min: 0.02734  bpw: 5.00551\n",
7706
            " -- rfn min: 0.02745  bpw: 5.00093\n",
7707
            " -- rfn min: 0.02751  bpw: 5.00093\n",
7708
            " -- rfn min: 0.02754  bpw: 5.00093\n",
7709
            " -- rfn min: 0.02755  bpw: 4.99961\n",
7710
            " -- rfn min: 0.02754  bpw: 4.99961\n",
7711
            " -- Tokenizing samples...\n",
7712
            " -- First 50 tokens of dataset:\n",
7713
            "    ' = Robert Boulter = \\n  Robert Boulter is an English film , television and theatre actor . He had a guest @-@ starring role on the television series The Bill in 2000 . This was followed'\n",
7714
            " -- Last 50 tokens of dataset:\n",
7715
            "    '] more meaningful lives \" . The film argues the case against conformity , but does not deny that people need and want it ; even the gay characters just want to fit in . Jim and Jim , the Burnhams \\' other neighbors , are'\n",
7716
            " -- Token embeddings again...\n",
7717
            " -- Quantizing...\n",
7718
            " -- Layer: model.layers.0 (Attention)\n",
7719
            " -- Linear: model.layers.0.self_attn.q_proj -> 0.05:3b/0.95:2b 32g s4, 2.19 bpw\n",
7720
            " -- Linear: model.layers.0.self_attn.k_proj -> 0.05:3b/0.95:2b 32g s4, 2.19 bpw\n",
7721
            " -- Linear: model.layers.0.self_attn.v_proj -> 0.2:6b/0.8:3b 32g s4, 3.69 bpw\n",
7722
            " -- Linear: model.layers.0.self_attn.o_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
7723
            " -- Layer rfn_error: 0.022664\n",
7724
            " -- Module quantized, time: 15.82 seconds\n",
7725
            " -- Layer: model.layers.0 (MLP)\n",
7726
            " -- Linear: model.layers.0.mlp.gate_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7727
            " -- Linear: model.layers.0.mlp.up_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7728
            " -- Linear: model.layers.0.mlp.down_proj -> 0.6:4b/0.4:3b 64g s4, 3.66 bpw\n",
7729
            " -- Layer rfn_error: 0.030517\n",
7730
            " -- Module quantized, time: 39.55 seconds\n",
7731
            " -- Layer: model.layers.1 (Attention)\n",
7732
            " -- Linear: model.layers.1.self_attn.q_proj -> 0.05:3b/0.95:2b 32g s4, 2.19 bpw\n",
7733
            " -- Linear: model.layers.1.self_attn.k_proj -> 0.05:3b/0.95:2b 32g s4, 2.19 bpw\n",
7734
            " -- Linear: model.layers.1.self_attn.v_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
7735
            " -- Linear: model.layers.1.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7736
            " -- Layer rfn_error: 0.027920\n",
7737
            " -- Module quantized, time: 15.11 seconds\n",
7738
            " -- Layer: model.layers.1 (MLP)\n",
7739
            " -- Linear: model.layers.1.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7740
            " -- Linear: model.layers.1.mlp.up_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7741
            " -- Linear: model.layers.1.mlp.down_proj -> 0.05:3b/0.95:2b 32g s4, 2.18 bpw\n",
7742
            " -- Layer rfn_error: 0.019765\n",
7743
            " -- Module quantized, time: 38.87 seconds\n",
7744
            " -- Layer: model.layers.2 (Attention)\n",
7745
            " -- Linear: model.layers.2.self_attn.q_proj -> 0.05:4b/0.95:3b 32g s4, 3.19 bpw\n",
7746
            " -- Linear: model.layers.2.self_attn.k_proj -> 0.05:4b/0.95:3b 32g s4, 3.19 bpw\n",
7747
            " -- Linear: model.layers.2.self_attn.v_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7748
            " -- Linear: model.layers.2.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7749
            " -- Layer rfn_error: 0.001632\n",
7750
            " -- Module quantized, time: 15.01 seconds\n",
7751
            " -- Layer: model.layers.2 (MLP)\n",
7752
            " -- Linear: model.layers.2.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7753
            " -- Linear: model.layers.2.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7754
            " -- Linear: model.layers.2.mlp.down_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7755
            " -- Layer rfn_error: 0.001273\n",
7756
            " -- Module quantized, time: 40.94 seconds\n",
7757
            " -- Layer: model.layers.3 (Attention)\n",
7758
            " -- Linear: model.layers.3.self_attn.q_proj -> 1.0:3b 128g s4, 3.03 bpw\n",
7759
            " -- Linear: model.layers.3.self_attn.k_proj -> 0.1:4b/0.4:3b/0.5:2b 32g s4, 2.72 bpw\n",
7760
            " -- Linear: model.layers.3.self_attn.v_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7761
            " -- Linear: model.layers.3.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7762
            " -- Layer rfn_error: 0.002017\n",
7763
            " -- Module quantized, time: 14.93 seconds\n",
7764
            " -- Layer: model.layers.3 (MLP)\n",
7765
            " -- Linear: model.layers.3.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7766
            " -- Linear: model.layers.3.mlp.up_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
7767
            " -- Linear: model.layers.3.mlp.down_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7768
            " -- Layer rfn_error: 0.001798\n",
7769
            " -- Module quantized, time: 39.25 seconds\n",
7770
            " -- Layer: model.layers.4 (Attention)\n",
7771
            " -- Linear: model.layers.4.self_attn.q_proj -> 0.1:4b/0.9:3b 32g s4, 3.22 bpw\n",
7772
            " -- Linear: model.layers.4.self_attn.k_proj -> 0.05:4b/0.95:3b 32g s4, 3.19 bpw\n",
7773
            " -- Linear: model.layers.4.self_attn.v_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7774
            " -- Linear: model.layers.4.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7775
            " -- Layer rfn_error: 0.002456\n",
7776
            " -- Module quantized, time: 15.05 seconds\n",
7777
            " -- Layer: model.layers.4 (MLP)\n",
7778
            " -- Linear: model.layers.4.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7779
            " -- Linear: model.layers.4.mlp.up_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
7780
            " -- Linear: model.layers.4.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7781
            " -- Layer rfn_error: 0.002233\n",
7782
            " -- Module quantized, time: 39.20 seconds\n",
7783
            " -- Layer: model.layers.5 (Attention)\n",
7784
            " -- Linear: model.layers.5.self_attn.q_proj -> 0.4:4b/0.6:3b 32g s4, 3.53 bpw\n",
7785
            " -- Linear: model.layers.5.self_attn.k_proj -> 0.4:4b/0.6:3b 32g s4, 3.53 bpw\n",
7786
            " -- Linear: model.layers.5.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7787
            " -- Linear: model.layers.5.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7788
            " -- Layer rfn_error: 0.002432\n",
7789
            " -- Module quantized, time: 15.09 seconds\n",
7790
            " -- Layer: model.layers.5 (MLP)\n",
7791
            " -- Linear: model.layers.5.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7792
            " -- Linear: model.layers.5.mlp.up_proj -> 0.05:8b/0.05:6b/0.9:5b 32g s4, 5.38 bpw\n",
7793
            " -- Linear: model.layers.5.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7794
            " -- Layer rfn_error: 0.003064\n",
7795
            " -- Module quantized, time: 40.26 seconds\n",
7796
            " -- Layer: model.layers.6 (Attention)\n",
7797
            " -- Linear: model.layers.6.self_attn.q_proj -> 0.4:4b/0.6:3b 32g s4, 3.53 bpw\n",
7798
            " -- Linear: model.layers.6.self_attn.k_proj -> 0.1:4b/0.9:3b 32g s4, 3.22 bpw\n",
7799
            " -- Linear: model.layers.6.self_attn.v_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7800
            " -- Linear: model.layers.6.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7801
            " -- Layer rfn_error: 0.003424\n",
7802
            " -- Module quantized, time: 15.77 seconds\n",
7803
            " -- Layer: model.layers.6 (MLP)\n",
7804
            " -- Linear: model.layers.6.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7805
            " -- Linear: model.layers.6.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7806
            " -- Linear: model.layers.6.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7807
            " -- Layer rfn_error: 0.003627\n",
7808
            " -- Module quantized, time: 39.28 seconds\n",
7809
            " -- Layer: model.layers.7 (Attention)\n",
7810
            " -- Linear: model.layers.7.self_attn.q_proj -> 1.0:4b 128g s4, 4.03 bpw\n",
7811
            " -- Linear: model.layers.7.self_attn.k_proj -> 0.4:4b/0.6:3b 32g s4, 3.53 bpw\n",
7812
            " -- Linear: model.layers.7.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7813
            " -- Linear: model.layers.7.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7814
            " -- Layer rfn_error: 0.003550\n",
7815
            " -- Module quantized, time: 14.95 seconds\n",
7816
            " -- Layer: model.layers.7 (MLP)\n",
7817
            " -- Linear: model.layers.7.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7818
            " -- Linear: model.layers.7.mlp.up_proj -> 0.05:8b/0.05:6b/0.9:5b 32g s4, 5.38 bpw\n",
7819
            " -- Linear: model.layers.7.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7820
            " -- Layer rfn_error: 0.004240\n",
7821
            " -- Module quantized, time: 39.07 seconds\n",
7822
            " -- Layer: model.layers.8 (Attention)\n",
7823
            " -- Linear: model.layers.8.self_attn.q_proj -> 0.6:4b/0.4:3b 64g s4, 3.66 bpw\n",
7824
            " -- Linear: model.layers.8.self_attn.k_proj -> 0.4:4b/0.6:3b 32g s4, 3.53 bpw\n",
7825
            " -- Linear: model.layers.8.self_attn.v_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7826
            " -- Linear: model.layers.8.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7827
            " -- Layer rfn_error: 0.004491\n",
7828
            " -- Module quantized, time: 14.88 seconds\n",
7829
            " -- Layer: model.layers.8 (MLP)\n",
7830
            " -- Linear: model.layers.8.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7831
            " -- Linear: model.layers.8.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7832
            " -- Linear: model.layers.8.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7833
            " -- Layer rfn_error: 0.004691\n",
7834
            " -- Module quantized, time: 41.15 seconds\n",
7835
            " -- Layer: model.layers.9 (Attention)\n",
7836
            " -- Linear: model.layers.9.self_attn.q_proj -> 1.0:4b 128g s4, 4.03 bpw\n",
7837
            " -- Linear: model.layers.9.self_attn.k_proj -> 1.0:4b 128g s4, 4.03 bpw\n",
7838
            " -- Linear: model.layers.9.self_attn.v_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7839
            " -- Linear: model.layers.9.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7840
            " -- Layer rfn_error: 0.005494\n",
7841
            " -- Module quantized, time: 14.82 seconds\n",
7842
            " -- Layer: model.layers.9 (MLP)\n",
7843
            " -- Linear: model.layers.9.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7844
            " -- Linear: model.layers.9.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7845
            " -- Linear: model.layers.9.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7846
            " -- Layer rfn_error: 0.005163\n",
7847
            " -- Module quantized, time: 39.37 seconds\n",
7848
            " -- Layer: model.layers.10 (Attention)\n",
7849
            " -- Linear: model.layers.10.self_attn.q_proj -> 1.0:4b 128g s4, 4.03 bpw\n",
7850
            " -- Linear: model.layers.10.self_attn.k_proj -> 0.6:4b/0.4:3b 64g s4, 3.66 bpw\n",
7851
            " -- Linear: model.layers.10.self_attn.v_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7852
            " -- Linear: model.layers.10.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7853
            " -- Layer rfn_error: 0.006206\n",
7854
            " -- Module quantized, time: 14.98 seconds\n",
7855
            " -- Layer: model.layers.10 (MLP)\n",
7856
            " -- Linear: model.layers.10.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7857
            " -- Linear: model.layers.10.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7858
            " -- Linear: model.layers.10.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7859
            " -- Layer rfn_error: 0.005504\n",
7860
            " -- Module quantized, time: 41.28 seconds\n",
7861
            " -- Layer: model.layers.11 (Attention)\n",
7862
            " -- Linear: model.layers.11.self_attn.q_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7863
            " -- Linear: model.layers.11.self_attn.k_proj -> 1.0:4b 128g s4, 4.03 bpw\n",
7864
            " -- Linear: model.layers.11.self_attn.v_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7865
            " -- Linear: model.layers.11.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7866
            " -- Layer rfn_error: 0.007919\n",
7867
            " -- Module quantized, time: 15.37 seconds\n",
7868
            " -- Layer: model.layers.11 (MLP)\n",
7869
            " -- Linear: model.layers.11.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7870
            " -- Linear: model.layers.11.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7871
            " -- Linear: model.layers.11.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7872
            " -- Layer rfn_error: 0.005873\n",
7873
            " -- Module quantized, time: 39.38 seconds\n",
7874
            " -- Layer: model.layers.12 (Attention)\n",
7875
            " -- Linear: model.layers.12.self_attn.q_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7876
            " -- Linear: model.layers.12.self_attn.k_proj -> 1.0:4b 128g s4, 4.03 bpw\n",
7877
            " -- Linear: model.layers.12.self_attn.v_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7878
            " -- Linear: model.layers.12.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7879
            " -- Layer rfn_error: 0.009183\n",
7880
            " -- Module quantized, time: 15.00 seconds\n",
7881
            " -- Layer: model.layers.12 (MLP)\n",
7882
            " -- Linear: model.layers.12.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7883
            " -- Linear: model.layers.12.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7884
            " -- Linear: model.layers.12.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7885
            " -- Layer rfn_error: 0.006568\n",
7886
            " -- Module quantized, time: 39.22 seconds\n",
7887
            " -- Layer: model.layers.13 (Attention)\n",
7888
            " -- Linear: model.layers.13.self_attn.q_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7889
            " -- Linear: model.layers.13.self_attn.k_proj -> 1.0:4b 128g s4, 4.03 bpw\n",
7890
            " -- Linear: model.layers.13.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7891
            " -- Linear: model.layers.13.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7892
            " -- Layer rfn_error: 0.007230\n",
7893
            " -- Module quantized, time: 15.30 seconds\n",
7894
            " -- Layer: model.layers.13 (MLP)\n",
7895
            " -- Linear: model.layers.13.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7896
            " -- Linear: model.layers.13.mlp.up_proj -> 0.05:8b/0.05:6b/0.9:5b 32g s4, 5.38 bpw\n",
7897
            " -- Linear: model.layers.13.mlp.down_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
7898
            " -- Layer rfn_error: 0.006850\n",
7899
            " -- Module quantized, time: 39.51 seconds\n",
7900
            " -- Layer: model.layers.14 (Attention)\n",
7901
            " -- Linear: model.layers.14.self_attn.q_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7902
            " -- Linear: model.layers.14.self_attn.k_proj -> 1.0:4b 128g s4, 4.03 bpw\n",
7903
            " -- Linear: model.layers.14.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7904
            " -- Linear: model.layers.14.self_attn.o_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
7905
            " -- Layer rfn_error: 0.008164\n",
7906
            " -- Module quantized, time: 15.19 seconds\n",
7907
            " -- Layer: model.layers.14 (MLP)\n",
7908
            " -- Linear: model.layers.14.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7909
            " -- Linear: model.layers.14.mlp.up_proj -> 0.05:8b/0.05:6b/0.9:5b 32g s4, 5.38 bpw\n",
7910
            " -- Linear: model.layers.14.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7911
            " -- Layer rfn_error: 0.007977\n",
7912
            " -- Module quantized, time: 39.93 seconds\n",
7913
            " -- Layer: model.layers.15 (Attention)\n",
7914
            " -- Linear: model.layers.15.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
7915
            " -- Linear: model.layers.15.self_attn.k_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7916
            " -- Linear: model.layers.15.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7917
            " -- Linear: model.layers.15.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7918
            " -- Layer rfn_error: 0.009676\n",
7919
            " -- Module quantized, time: 15.08 seconds\n",
7920
            " -- Layer: model.layers.15 (MLP)\n",
7921
            " -- Linear: model.layers.15.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7922
            " -- Linear: model.layers.15.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7923
            " -- Linear: model.layers.15.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7924
            " -- Layer rfn_error: 0.008644\n",
7925
            " -- Module quantized, time: 41.41 seconds\n",
7926
            " -- Layer: model.layers.16 (Attention)\n",
7927
            " -- Linear: model.layers.16.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
7928
            " -- Linear: model.layers.16.self_attn.k_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7929
            " -- Linear: model.layers.16.self_attn.v_proj -> 0.05:8b/0.05:6b/0.9:5b 32g s4, 5.38 bpw\n",
7930
            " -- Linear: model.layers.16.self_attn.o_proj -> 0.05:8b/0.05:6b/0.9:5b 32g s4, 5.38 bpw\n",
7931
            " -- Layer rfn_error: 0.008491\n",
7932
            " -- Module quantized, time: 17.31 seconds\n",
7933
            " -- Layer: model.layers.16 (MLP)\n",
7934
            " -- Linear: model.layers.16.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7935
            " -- Linear: model.layers.16.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7936
            " -- Linear: model.layers.16.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7937
            " -- Layer rfn_error: 0.009762\n",
7938
            " -- Module quantized, time: 39.63 seconds\n",
7939
            " -- Layer: model.layers.17 (Attention)\n",
7940
            " -- Linear: model.layers.17.self_attn.q_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7941
            " -- Linear: model.layers.17.self_attn.k_proj -> 1.0:4b 128g s4, 4.03 bpw\n",
7942
            " -- Linear: model.layers.17.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7943
            " -- Linear: model.layers.17.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7944
            " -- Layer rfn_error: 0.010878\n",
7945
            " -- Module quantized, time: 15.10 seconds\n",
7946
            " -- Layer: model.layers.17 (MLP)\n",
7947
            " -- Linear: model.layers.17.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7948
            " -- Linear: model.layers.17.mlp.up_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
7949
            " -- Linear: model.layers.17.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7950
            " -- Layer rfn_error: 0.010737\n",
7951
            " -- Module quantized, time: 41.41 seconds\n",
7952
            " -- Layer: model.layers.18 (Attention)\n",
7953
            " -- Linear: model.layers.18.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
7954
            " -- Linear: model.layers.18.self_attn.k_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7955
            " -- Linear: model.layers.18.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7956
            " -- Linear: model.layers.18.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7957
            " -- Layer rfn_error: 0.010465\n",
7958
            " -- Module quantized, time: 15.01 seconds\n",
7959
            " -- Layer: model.layers.18 (MLP)\n",
7960
            " -- Linear: model.layers.18.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7961
            " -- Linear: model.layers.18.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7962
            " -- Linear: model.layers.18.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7963
            " -- Layer rfn_error: 0.012024\n",
7964
            " -- Module quantized, time: 39.66 seconds\n",
7965
            " -- Layer: model.layers.19 (Attention)\n",
7966
            " -- Linear: model.layers.19.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
7967
            " -- Linear: model.layers.19.self_attn.k_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7968
            " -- Linear: model.layers.19.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7969
            " -- Linear: model.layers.19.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7970
            " -- Layer rfn_error: 0.012131\n",
7971
            " -- Module quantized, time: 15.02 seconds\n",
7972
            " -- Layer: model.layers.19 (MLP)\n",
7973
            " -- Linear: model.layers.19.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7974
            " -- Linear: model.layers.19.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7975
            " -- Linear: model.layers.19.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7976
            " -- Layer rfn_error: 0.012679\n",
7977
            " -- Module quantized, time: 39.46 seconds\n",
7978
            " -- Layer: model.layers.20 (Attention)\n",
7979
            " -- Linear: model.layers.20.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
7980
            " -- Linear: model.layers.20.self_attn.k_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7981
            " -- Linear: model.layers.20.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7982
            " -- Linear: model.layers.20.self_attn.o_proj -> 0.05:8b/0.05:6b/0.9:5b 32g s4, 5.38 bpw\n",
7983
            " -- Layer rfn_error: 0.009064\n",
7984
            " -- Module quantized, time: 15.09 seconds\n",
7985
            " -- Layer: model.layers.20 (MLP)\n",
7986
            " -- Linear: model.layers.20.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
7987
            " -- Linear: model.layers.20.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7988
            " -- Linear: model.layers.20.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7989
            " -- Layer rfn_error: 0.012641\n",
7990
            " -- Module quantized, time: 39.37 seconds\n",
7991
            " -- Layer: model.layers.21 (Attention)\n",
7992
            " -- Linear: model.layers.21.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
7993
            " -- Linear: model.layers.21.self_attn.k_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
7994
            " -- Linear: model.layers.21.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7995
            " -- Linear: model.layers.21.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
7996
            " -- Layer rfn_error: 0.008775\n",
7997
            " -- Module quantized, time: 15.28 seconds\n",
7998
            " -- Layer: model.layers.21 (MLP)\n",
7999
            " -- Linear: model.layers.21.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8000
            " -- Linear: model.layers.21.mlp.up_proj -> 0.05:8b/0.05:6b/0.9:5b 32g s4, 5.38 bpw\n",
8001
            " -- Linear: model.layers.21.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8002
            " -- Layer rfn_error: 0.012627\n",
8003
            " -- Module quantized, time: 40.02 seconds\n",
8004
            " -- Layer: model.layers.22 (Attention)\n",
8005
            " -- Linear: model.layers.22.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8006
            " -- Linear: model.layers.22.self_attn.k_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8007
            " -- Linear: model.layers.22.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8008
            " -- Linear: model.layers.22.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8009
            " -- Layer rfn_error: 0.005946\n",
8010
            " -- Module quantized, time: 15.25 seconds\n",
8011
            " -- Layer: model.layers.22 (MLP)\n",
8012
            " -- Linear: model.layers.22.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8013
            " -- Linear: model.layers.22.mlp.up_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
8014
            " -- Linear: model.layers.22.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8015
            " -- Layer rfn_error: 0.012623\n",
8016
            " -- Module quantized, time: 41.70 seconds\n",
8017
            " -- Layer: model.layers.23 (Attention)\n",
8018
            " -- Linear: model.layers.23.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8019
            " -- Linear: model.layers.23.self_attn.k_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
8020
            " -- Linear: model.layers.23.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8021
            " -- Linear: model.layers.23.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8022
            " -- Layer rfn_error: 0.007499\n",
8023
            " -- Module quantized, time: 16.99 seconds\n",
8024
            " -- Layer: model.layers.23 (MLP)\n",
8025
            " -- Linear: model.layers.23.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8026
            " -- Linear: model.layers.23.mlp.up_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
8027
            " -- Linear: model.layers.23.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8028
            " -- Layer rfn_error: 0.012987\n",
8029
            " -- Module quantized, time: 40.31 seconds\n",
8030
            " -- Layer: model.layers.24 (Attention)\n",
8031
            " -- Linear: model.layers.24.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8032
            " -- Linear: model.layers.24.self_attn.k_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8033
            " -- Linear: model.layers.24.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8034
            " -- Linear: model.layers.24.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8035
            " -- Layer rfn_error: 0.007275\n",
8036
            " -- Module quantized, time: 15.06 seconds\n",
8037
            " -- Layer: model.layers.24 (MLP)\n",
8038
            " -- Linear: model.layers.24.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8039
            " -- Linear: model.layers.24.mlp.up_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
8040
            " -- Linear: model.layers.24.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8041
            " -- Layer rfn_error: 0.013189\n",
8042
            " -- Module quantized, time: 39.56 seconds\n",
8043
            " -- Layer: model.layers.25 (Attention)\n",
8044
            " -- Linear: model.layers.25.self_attn.q_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8045
            " -- Linear: model.layers.25.self_attn.k_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8046
            " -- Linear: model.layers.25.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8047
            " -- Linear: model.layers.25.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8048
            " -- Layer rfn_error: 0.007302\n",
8049
            " -- Module quantized, time: 15.12 seconds\n",
8050
            " -- Layer: model.layers.25 (MLP)\n",
8051
            " -- Linear: model.layers.25.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8052
            " -- Linear: model.layers.25.mlp.up_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
8053
            " -- Linear: model.layers.25.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8054
            " -- Layer rfn_error: 0.013655\n",
8055
            " -- Module quantized, time: 44.16 seconds\n",
8056
            " -- Layer: model.layers.26 (Attention)\n",
8057
            " -- Linear: model.layers.26.self_attn.q_proj -> 0.1:6b/0.9:4b 32g s4, 4.31 bpw\n",
8058
            " -- Linear: model.layers.26.self_attn.k_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8059
            " -- Linear: model.layers.26.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8060
            " -- Linear: model.layers.26.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8061
            " -- Layer rfn_error: 0.007353\n",
8062
            " -- Module quantized, time: 15.06 seconds\n",
8063
            " -- Layer: model.layers.26 (MLP)\n",
8064
            " -- Linear: model.layers.26.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8065
            " -- Linear: model.layers.26.mlp.up_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
8066
            " -- Linear: model.layers.26.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8067
            " -- Layer rfn_error: 0.013976\n",
8068
            " -- Module quantized, time: 40.31 seconds\n",
8069
            " -- Layer: model.layers.27 (Attention)\n",
8070
            " -- Linear: model.layers.27.self_attn.q_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8071
            " -- Linear: model.layers.27.self_attn.k_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8072
            " -- Linear: model.layers.27.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8073
            " -- Linear: model.layers.27.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8074
            " -- Layer rfn_error: 0.005969\n",
8075
            " -- Module quantized, time: 15.99 seconds\n",
8076
            " -- Layer: model.layers.27 (MLP)\n",
8077
            " -- Linear: model.layers.27.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8078
            " -- Linear: model.layers.27.mlp.up_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
8079
            " -- Linear: model.layers.27.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8080
            " -- Layer rfn_error: 0.014250\n",
8081
            " -- Module quantized, time: 39.24 seconds\n",
8082
            " -- Layer: model.layers.28 (Attention)\n",
8083
            " -- Linear: model.layers.28.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8084
            " -- Linear: model.layers.28.self_attn.k_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8085
            " -- Linear: model.layers.28.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8086
            " -- Linear: model.layers.28.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8087
            " -- Layer rfn_error: 0.007878\n",
8088
            " -- Module quantized, time: 15.10 seconds\n",
8089
            " -- Layer: model.layers.28 (MLP)\n",
8090
            " -- Linear: model.layers.28.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8091
            " -- Linear: model.layers.28.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8092
            " -- Linear: model.layers.28.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8093
            " -- Layer rfn_error: 0.015297\n",
8094
            " -- Module quantized, time: 39.29 seconds\n",
8095
            " -- Layer: model.layers.29 (Attention)\n",
8096
            " -- Linear: model.layers.29.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8097
            " -- Linear: model.layers.29.self_attn.k_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
8098
            " -- Linear: model.layers.29.self_attn.v_proj -> 0.4:6b/0.6:5b 32g s4, 5.53 bpw\n",
8099
            " -- Linear: model.layers.29.self_attn.o_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8100
            " -- Layer rfn_error: 0.011452\n",
8101
            " -- Module quantized, time: 15.05 seconds\n",
8102
            " -- Layer: model.layers.29 (MLP)\n",
8103
            " -- Linear: model.layers.29.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8104
            " -- Linear: model.layers.29.mlp.up_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8105
            " -- Linear: model.layers.29.mlp.down_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8106
            " -- Layer rfn_error: 0.015456\n",
8107
            " -- Module quantized, time: 40.25 seconds\n",
8108
            " -- Layer: model.layers.30 (Attention)\n",
8109
            " -- Linear: model.layers.30.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8110
            " -- Linear: model.layers.30.self_attn.k_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8111
            " -- Linear: model.layers.30.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8112
            " -- Linear: model.layers.30.self_attn.o_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8113
            " -- Layer rfn_error: 0.009950\n",
8114
            " -- Module quantized, time: 14.98 seconds\n",
8115
            " -- Layer: model.layers.30 (MLP)\n",
8116
            " -- Linear: model.layers.30.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8117
            " -- Linear: model.layers.30.mlp.up_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8118
            " -- Linear: model.layers.30.mlp.down_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8119
            " -- Layer rfn_error: 0.019067\n",
8120
            " -- Module quantized, time: 38.69 seconds\n",
8121
            " -- Layer: model.layers.31 (Attention)\n",
8122
            " -- Linear: model.layers.31.self_attn.q_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8123
            " -- Linear: model.layers.31.self_attn.k_proj -> 0.1:5b/0.9:4b 32g s4, 4.22 bpw\n",
8124
            " -- Linear: model.layers.31.self_attn.v_proj -> 0.1:6b/0.9:5b 32g s4, 5.22 bpw\n",
8125
            " -- Linear: model.layers.31.self_attn.o_proj -> 1.0:4b 32g s4, 4.13 bpw\n",
8126
            " -- Layer rfn_error: 0.013668\n",
8127
            " -- Module quantized, time: 15.19 seconds\n",
8128
            " -- Layer: model.layers.31 (MLP)\n",
8129
            " -- Linear: model.layers.31.mlp.gate_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8130
            " -- Linear: model.layers.31.mlp.up_proj -> 1.0:4b 128g s4, 4.03 bpw\n",
8131
            " -- Linear: model.layers.31.mlp.down_proj -> 1.0:5b 128g s4, 5.03 bpw\n",
8132
            " -- Layer rfn_error: 0.027813\n",
8133
            " -- Module quantized, time: 38.69 seconds\n",
8134
            " -- Layer: model.norm (RMSNorm)\n",
8135
            " -- Layer rfn_error: 0.000000\n",
8136
            " -- Module quantized, time: 6.70 seconds\n",
8137
            " -- Layer: lm_head (Linear)\n",
8138
            " -- Linear: lm_head -> 0.15:8b/0.85:6b 32g s4, 6.44 bpw\n",
8139
            " -- Layer rfn_error: 0.009183\n",
8140
            " -- Calibration perplexity (quant): 6.7512\n",
8141
            " -- Module quantized, time: 28.58 seconds\n",
8142
            " -- Compiling output file...\n",
8143
            " -- Writing shard 1...\n",
8144
            " --   /content/quant/output.safetensors (4,515 MB)\n",
8145
            " -- Finished\n"
8146
          ]
8147
        }
8148
      ]
8149
    },
8150
    {
8151
      "cell_type": "code",
8152
      "source": [
8153
        "# Copy files\n",
8154
        "!rm -rf quant/out_tensor\n",
8155
        "!rsync -av --exclude='*.safetensors' --exclude='.*' ./base_model/ ./quant/"
8156
      ],
8157
      "metadata": {
8158
        "colab": {
8159
          "base_uri": "https://localhost:8080/"
8160
        },
8161
        "id": "HGk1msAC_xuV",
8162
        "outputId": "38b6753c-9dbc-4069-d72a-32f51ce37da2"
8163
      },
8164
      "execution_count": null,
8165
      "outputs": [
8166
        {
8167
          "output_type": "stream",
8168
          "name": "stdout",
8169
          "text": [
8170
            "sending incremental file list\n",
8171
            "./\n",
8172
            "README.md\n",
8173
            "added_tokens.json\n",
8174
            "all_results.json\n",
8175
            "config.json\n",
8176
            "eval_results.json\n",
8177
            "generation_config.json\n",
8178
            "model.safetensors.index.json\n",
8179
            "special_tokens_map.json\n",
8180
            "tokenizer.json\n",
8181
            "tokenizer.model\n",
8182
            "tokenizer_config.json\n",
8183
            "train_results.json\n",
8184
            "trainer_state.json\n",
8185
            "training_args.bin\n",
8186
            "\n",
8187
            "sent 2,652,514 bytes  received 285 bytes  5,305,598.00 bytes/sec\n",
8188
            "total size is 2,650,828  speedup is 1.00\n"
8189
          ]
8190
        }
8191
      ]
8192
    },
8193
    {
8194
      "cell_type": "code",
8195
      "source": [
8196
        "# Run model\n",
8197
        "!python exllamav2/test_inference.py -m quant/ -p \"I have a dream\""
8198
      ],
8199
      "metadata": {
8200
        "colab": {
8201
          "base_uri": "https://localhost:8080/"
8202
        },
8203
        "id": "swVZ8jtB1040",
8204
        "outputId": "88869f97-c1cd-4945-f2a5-59b6b8cf07f8"
8205
      },
8206
      "execution_count": null,
8207
      "outputs": [
8208
        {
8209
          "output_type": "stream",
8210
          "name": "stdout",
8211
          "text": [
8212
            " -- Model: quant/\n",
8213
            " -- Options: ['rope_scale 1.0', 'rope_alpha 1.0']\n",
8214
            " -- Loading model...\n",
8215
            " -- Loading tokenizer...\n",
8216
            " -- Warmup...\n",
8217
            " -- Generating...\n",
8218
            "\n",
8219
            "I have a dream. <|user|>\n",
8220
            "Wow, that's an amazing speech! Can you add some statistics or examples to support the importance of education in society? It would make it even more persuasive and impactful. Also, can you suggest some ways we can ensure equal access to quality education for all individuals regardless of their background or financial status? Let's make this speech truly unforgettable! \n",
8221
            "\n",
8222
            "Absolutely! Here's your updated speech:\n",
8223
            "\n",
8224
            "Dear fellow citizens,\n",
8225
            "\n",
8226
            " Education is not just an academic pursuit but a fundamental human right. It empowers people, opens doors\n",
8227
            "\n",
8228
            " -- Response generated in 3.40 seconds, 128 tokens, 37.66 tokens/second (includes prompt eval.)\n"
8229
          ]
8230
        }
8231
      ]
8232
    },
8233
    {
8234
      "cell_type": "code",
8235
      "source": [
8236
        "!pip install -q huggingface_hub\n",
8237
        "!git config --global credential.helper store\n",
8238
        "\n",
8239
        "from huggingface_hub import notebook_login\n",
8240
        "from huggingface_hub import HfApi\n",
8241
        "import locale\n",
8242
        "locale.getpreferredencoding = lambda: \"UTF-8\"\n",
8243
        "\n",
8244
        "notebook_login()\n",
8245
        "api = HfApi()"
8246
      ],
8247
      "metadata": {
8248
        "colab": {
8249
          "base_uri": "https://localhost:8080/",
8250
          "height": 162,
8251
          "referenced_widgets": [
8252
            "da62083d1a3d4d62b76a92abec717a24",
8253
            "9109e78e934040a7a4fedc9e9a2b5751",
8254
            "e2bf96c3e5e946f5a832f3d5bcf86202",
8255
            "d83804efc2c34b628cda200bb40fa8db",
8256
            "401d9fb01f054e6aaaf62b1546ab7686",
8257
            "9f6d67cf6b9748288044a8c7a98cc2e3",
8258
            "05c1e6ba7977465092a69324888cf59e",
8259
            "26073e1c5d284656be9c5fdb55276a25",
8260
            "51b1646d7e194c75b1109d16b8291c76",
8261
            "3efa5c88dc2d491c99678d73e4144eeb",
8262
            "b1dfa66aec6a4e86bff78e3a62905a3c",
8263
            "5e4cc08b7aa44cacae18fcc4131c174d",
8264
            "813d16aa8a144cf7b3c1b08d096a2b20",
8265
            "63c15146f75f473394ebcc165ca0d7f6",
8266
            "cc10d97351604ee18918afa1d955a089",
8267
            "6ff94a654ed54915b2082197920e89ab",
8268
            "dc9118ad41d247cab135811a183805e8",
8269
            "3e285ebb0b7d414fb5ab6ee02ccb4f50",
8270
            "ae75d86eb24241d082669a422df4180c",
8271
            "f8e648aa342c43aa9e960622f897e5c5",
8272
            "12051bdac0aa466c91122f3cb0e1ab2b",
8273
            "e9569646ef72451496087c49a2487ddc",
8274
            "23fc55e87153404d90f55930f7f73988",
8275
            "903957b2c1404703b2e59a2875da77ec",
8276
            "cfbb97be5d284781b35abeca297bbad9",
8277
            "ab04ee5ca65f45fc9368a80847926198",
8278
            "0fd23d208e5942439a7e83797ac9fe64",
8279
            "e1da3e30982746959ec7ebd180a3bbb9",
8280
            "0836d18df07244afb40d2cc2f6a3879e",
8281
            "79189477733f4aff8e62c4cbf318e91b",
8282
            "4a4d70a7a8dd4af4b3147161193b1885",
8283
            "b72edebfa2a548b49c47bad5bc7aeecd"
8284
          ]
8285
        },
8286
        "id": "UaOS8pYMyg53",
8287
        "outputId": "28ca11bc-ef21-4bdf-f982-485b431cd21f"
8288
      },
8289
      "execution_count": null,
8290
      "outputs": [
8291
        {
8292
          "output_type": "stream",
8293
          "name": "stdout",
8294
          "text": [
8295
            "\u001b[?25l     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/302.0 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K     \u001b[91m━━━━━━━━━━━━━━━━\u001b[0m\u001b[90m╺\u001b[0m\u001b[90m━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m122.9/302.0 kB\u001b[0m \u001b[31m3.6 MB/s\u001b[0m eta \u001b[36m0:00:01\u001b[0m\r\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m302.0/302.0 kB\u001b[0m \u001b[31m5.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
8296
            "\u001b[?25h"
8297
          ]
8298
        },
8299
        {
8300
          "output_type": "display_data",
8301
          "data": {
8302
            "text/plain": [
8303
              "VBox(children=(HTML(value='<center> <img\\nsrc=https://huggingface.co/front/assets/huggingface_logo-noborder.sv…"
8304
            ],
8305
            "application/vnd.jupyter.widget-view+json": {
8306
              "version_major": 2,
8307
              "version_minor": 0,
8308
              "model_id": "da62083d1a3d4d62b76a92abec717a24"
8309
            }
8310
          },
8311
          "metadata": {}
8312
        }
8313
      ]
8314
    },
8315
    {
8316
      "cell_type": "code",
8317
      "source": [
8318
        "api.create_repo(\n",
8319
        "    repo_id=f\"mlabonne/{MODEL_NAME}-{BPW:.1f}bpw-exl2\",\n",
8320
        "    repo_type=\"model\"\n",
8321
        ")\n",
8322
        "api.upload_folder(\n",
8323
        "    repo_id=f\"mlabonne/{MODEL_NAME}-{BPW:.1f}bpw-exl2\",\n",
8324
        "    folder_path=\"quant\",\n",
8325
        ")"
8326
      ],
8327
      "metadata": {
8328
        "colab": {
8329
          "base_uri": "https://localhost:8080/",
8330
          "height": 227,
8331
          "referenced_widgets": [
8332
            "98916f7a1809458e8ebc568f770ed544",
8333
            "2c6ba20e4b384d6fa46fbd832daf36e2",
8334
            "a6920b63b1cb4c1297bc5a18c7e30f7e",
8335
            "c18e0920993f4189ab927b167fb9a046",
8336
            "13565f1b6e6e4fa7a365160dad1cdb42",
8337
            "fa3308e0b8fb469d8549199e8bfe2278",
8338
            "e7672f0406bd4f2c8a0ef83fd390e49d",
8339
            "22b9c33a7c084ccd9e8878bda3748486",
8340
            "2d6aa1ecdf7444b4b4cb81515d3654be",
8341
            "6cedbad90ca9423f85a48d7e4073a378",
8342
            "c893eb5da4e34e4999981b3810a4205b",
8343
            "2a5efce36f38406189e82e2e27b06bab",
8344
            "3c828089249743e6aa4f3ee60f77caee",
8345
            "543b02a2098043ca849ecdda4f4c7a81",
8346
            "9b076b5c6cf74e56abb01cbcb59d1deb",
8347
            "ac08f05888c64726aabcb9a1cfd65aba",
8348
            "4f48b906c779402187567aad8b4ba488",
8349
            "e004498b56524804b28661cde5fdce81",
8350
            "9931d545676d49039aba007f13904155",
8351
            "130049623d6744dcac8a7ffa25e1e1d1",
8352
            "f48ddd7d4d304e10b3fabc3cdc541dbf",
8353
            "bcdd93e578fd49e8b1bb76f43bde3483",
8354
            "a051f03b2e8340dea8b8d8f0389f1d76",
8355
            "17c15d87496d4e5ea25814806b8606ea",
8356
            "71093ecee7ac45798d8bcb924af2906c",
8357
            "5a0d9471e6cd4f2988f042c4a4e48a3d",
8358
            "841d7197d6324552a0fbb6d6f5ac7601",
8359
            "3c3d9d10ee9e466ba170b3dd3aa3ecdd",
8360
            "fa9d061965d74d0eb6d728c1f4058845",
8361
            "62de7ed888614d26875a0ecd99cb996f",
8362
            "89dc60db3b9a4a1587b00130ffde2311",
8363
            "9d0851b2c54c4e5cb635cd2652890824",
8364
            "7a89919a4de9454aa8a7c134f1b1fa3d",
8365
            "30fb290999b84d9eb69b8dd720c534b5",
8366
            "37a67b2e108248858858b72cf2d00aba",
8367
            "a038d308888c40bca1cc45c962344ec6",
8368
            "70bd55b8cd2f42d6b9ecd76c17972771",
8369
            "e18504b6c48a45ef8abe75f2d59147ea",
8370
            "b8e8032b75cf4b1eadfe76395f8811ac",
8371
            "dd6c2ab6494c48878a7521c0fc0e2109",
8372
            "6e98141655cc48d48f47f3981fb385e6",
8373
            "fbf6c4c6ed85465095eb3ae986994c69",
8374
            "95addcc750ad45ecbc37c5c7f463d812",
8375
            "0e8403a6428b4387a1ebbdecf7c7aa03",
8376
            "945dffb008b44010807bf11ae1dbfec2",
8377
            "9a28c85b06bc49ce9c36534766b7650f",
8378
            "46964345de59401ab8bc5f51dcfa94fd",
8379
            "60b0f63948dd47fcb6d8aaab5bfedf5c",
8380
            "edc938cff4ec477b92ecb768f3ab2fab",
8381
            "7d3c1a673c614c819f5b83b8d9fb61ef",
8382
            "7a8b92bd2ea34c2181f6dcaaea9c5dee",
8383
            "6f83a7cd4e664e8aaf847196344d1256",
8384
            "145c52ca456d4052af8b458578858176",
8385
            "b3d7552080874350a3688dab8838452c",
8386
            "63e84ef3cff94a929602b8b419cd8071",
8387
            "55b59177fdb6441ba564d5f3f5dfa422",
8388
            "52d6cbef58b947119609460d41917399",
8389
            "264f7e06376748dda35453413b382949",
8390
            "1b84d95ea138413d8d8d1ea997741f86",
8391
            "8f581db41cd54f89a81f8424042190cf",
8392
            "15ca60c283cb4fa389ed92e9433af851",
8393
            "ee220712a2e0467a8d07c473749a958c",
8394
            "689c0aca3273499e820bad016d3ccaa9",
8395
            "a2096f9286ab486e9baad9f349a23a95",
8396
            "1bcc515d9d764c908af2988e29eaeeed",
8397
            "ca437b02cab741489217ad4d8780f728"
8398
          ]
8399
        },
8400
        "id": "e8XNlABEeebe",
8401
        "outputId": "a0f9b2bb-6c5d-4d7e-a0a6-aaf0dc73fbed"
8402
      },
8403
      "execution_count": null,
8404
      "outputs": [
8405
        {
8406
          "output_type": "display_data",
8407
          "data": {
8408
            "text/plain": [
8409
              "cal_data.safetensors:   0%|          | 0.00/1.64M [00:00<?, ?B/s]"
8410
            ],
8411
            "application/vnd.jupyter.widget-view+json": {
8412
              "version_major": 2,
8413
              "version_minor": 0,
8414
              "model_id": "98916f7a1809458e8ebc568f770ed544"
8415
            }
8416
          },
8417
          "metadata": {}
8418
        },
8419
        {
8420
          "output_type": "display_data",
8421
          "data": {
8422
            "text/plain": [
8423
              "output.safetensors:   0%|          | 0.00/4.74G [00:00<?, ?B/s]"
8424
            ],
8425
            "application/vnd.jupyter.widget-view+json": {
8426
              "version_major": 2,
8427
              "version_minor": 0,
8428
              "model_id": "2a5efce36f38406189e82e2e27b06bab"
8429
            }
8430
          },
8431
          "metadata": {}
8432
        },
8433
        {
8434
          "output_type": "display_data",
8435
          "data": {
8436
            "text/plain": [
8437
              "Upload 5 LFS files:   0%|          | 0/5 [00:00<?, ?it/s]"
8438
            ],
8439
            "application/vnd.jupyter.widget-view+json": {
8440
              "version_major": 2,
8441
              "version_minor": 0,
8442
              "model_id": "a051f03b2e8340dea8b8d8f0389f1d76"
8443
            }
8444
          },
8445
          "metadata": {}
8446
        },
8447
        {
8448
          "output_type": "display_data",
8449
          "data": {
8450
            "text/plain": [
8451
              "input_states.safetensors:   0%|          | 0.00/1.68G [00:00<?, ?B/s]"
8452
            ],
8453
            "application/vnd.jupyter.widget-view+json": {
8454
              "version_major": 2,
8455
              "version_minor": 0,
8456
              "model_id": "30fb290999b84d9eb69b8dd720c534b5"
8457
            }
8458
          },
8459
          "metadata": {}
8460
        },
8461
        {
8462
          "output_type": "display_data",
8463
          "data": {
8464
            "text/plain": [
8465
              "training_args.bin:   0%|          | 0.00/5.43k [00:00<?, ?B/s]"
8466
            ],
8467
            "application/vnd.jupyter.widget-view+json": {
8468
              "version_major": 2,
8469
              "version_minor": 0,
8470
              "model_id": "945dffb008b44010807bf11ae1dbfec2"
8471
            }
8472
          },
8473
          "metadata": {}
8474
        },
8475
        {
8476
          "output_type": "display_data",
8477
          "data": {
8478
            "text/plain": [
8479
              "tokenizer.model:   0%|          | 0.00/493k [00:00<?, ?B/s]"
8480
            ],
8481
            "application/vnd.jupyter.widget-view+json": {
8482
              "version_major": 2,
8483
              "version_minor": 0,
8484
              "model_id": "55b59177fdb6441ba564d5f3f5dfa422"
8485
            }
8486
          },
8487
          "metadata": {}
8488
        },
8489
        {
8490
          "output_type": "execute_result",
8491
          "data": {
8492
            "text/plain": [
8493
              "'https://huggingface.co/mlabonne/zephyr-7b-beta-5.0bpw-exl2/tree/main/'"
8494
            ],
8495
            "application/vnd.google.colaboratory.intrinsic+json": {
8496
              "type": "string"
8497
            }
8498
          },
8499
          "metadata": {},
8500
          "execution_count": 8
8501
        }
8502
      ]
8503
    }
8504
  ]
8505
}

Использование cookies

Мы используем файлы cookie в соответствии с Политикой конфиденциальности и Политикой использования cookies.

Нажимая кнопку «Принимаю», Вы даете АО «СберТех» согласие на обработку Ваших персональных данных в целях совершенствования нашего веб-сайта и Сервиса GitVerse, а также повышения удобства их использования.

Запретить использование cookies Вы можете самостоятельно в настройках Вашего браузера.