codeShare commited on
Commit
b5d655d
·
verified ·
1 Parent(s): 17791c8

Upload create_hidream_sdnq.ipynb

Browse files
colab_notebooks/create_hidream_sdnq.ipynb CHANGED
@@ -2752,7 +2752,7 @@
2752
  "description_width": ""
2753
  }
2754
  },
2755
- "db161b32e9274be58b559b187b6d292a": {
2756
  "model_module": "@jupyter-widgets/controls",
2757
  "model_name": "HBoxModel",
2758
  "model_module_version": "1.5.0",
@@ -2767,14 +2767,14 @@
2767
  "_view_name": "HBoxView",
2768
  "box_style": "",
2769
  "children": [
2770
- "IPY_MODEL_f7b656d8f6db48a4b2186383cbc84b29",
2771
- "IPY_MODEL_4e828087d74f430ab772b462790a8903",
2772
- "IPY_MODEL_53631f8fedcd4c5b8a4f5dc5768292c5"
2773
  ],
2774
- "layout": "IPY_MODEL_b8e2f351331041f6bab1eeacf953a2b0"
2775
  }
2776
  },
2777
- "f7b656d8f6db48a4b2186383cbc84b29": {
2778
  "model_module": "@jupyter-widgets/controls",
2779
  "model_name": "HTMLModel",
2780
  "model_module_version": "1.5.0",
@@ -2789,13 +2789,13 @@
2789
  "_view_name": "HTMLView",
2790
  "description": "",
2791
  "description_tooltip": null,
2792
- "layout": "IPY_MODEL_3cbf7135fc77424aaa12cb2c5be57743",
2793
  "placeholder": "​",
2794
- "style": "IPY_MODEL_a2d41db1f50f4714bbe2a058b7edccaf",
2795
- "value": "Fetching 7 files:  14%"
2796
  }
2797
  },
2798
- "4e828087d74f430ab772b462790a8903": {
2799
  "model_module": "@jupyter-widgets/controls",
2800
  "model_name": "FloatProgressModel",
2801
  "model_module_version": "1.5.0",
@@ -2808,18 +2808,18 @@
2808
  "_view_module": "@jupyter-widgets/controls",
2809
  "_view_module_version": "1.5.0",
2810
  "_view_name": "ProgressView",
2811
- "bar_style": "",
2812
  "description": "",
2813
  "description_tooltip": null,
2814
- "layout": "IPY_MODEL_a49f9939455349dda171ba76ac1fa329",
2815
- "max": 7,
2816
  "min": 0,
2817
  "orientation": "horizontal",
2818
- "style": "IPY_MODEL_0508252a7b894233837b0a7fcb57d151",
2819
- "value": 1
2820
  }
2821
  },
2822
- "53631f8fedcd4c5b8a4f5dc5768292c5": {
2823
  "model_module": "@jupyter-widgets/controls",
2824
  "model_name": "HTMLModel",
2825
  "model_module_version": "1.5.0",
@@ -2834,13 +2834,13 @@
2834
  "_view_name": "HTMLView",
2835
  "description": "",
2836
  "description_tooltip": null,
2837
- "layout": "IPY_MODEL_53ef4ff9f2ba4e528e8e59f46b935044",
2838
  "placeholder": "​",
2839
- "style": "IPY_MODEL_c44afc7fe718421bbc8617d24c56593c",
2840
- "value": " 1/7 [00:00<00:05,  1.16it/s]"
2841
  }
2842
  },
2843
- "b8e2f351331041f6bab1eeacf953a2b0": {
2844
  "model_module": "@jupyter-widgets/base",
2845
  "model_name": "LayoutModel",
2846
  "model_module_version": "1.2.0",
@@ -2892,7 +2892,7 @@
2892
  "width": null
2893
  }
2894
  },
2895
- "3cbf7135fc77424aaa12cb2c5be57743": {
2896
  "model_module": "@jupyter-widgets/base",
2897
  "model_name": "LayoutModel",
2898
  "model_module_version": "1.2.0",
@@ -2944,7 +2944,7 @@
2944
  "width": null
2945
  }
2946
  },
2947
- "a2d41db1f50f4714bbe2a058b7edccaf": {
2948
  "model_module": "@jupyter-widgets/controls",
2949
  "model_name": "DescriptionStyleModel",
2950
  "model_module_version": "1.5.0",
@@ -2959,7 +2959,7 @@
2959
  "description_width": ""
2960
  }
2961
  },
2962
- "a49f9939455349dda171ba76ac1fa329": {
2963
  "model_module": "@jupyter-widgets/base",
2964
  "model_name": "LayoutModel",
2965
  "model_module_version": "1.2.0",
@@ -3011,7 +3011,7 @@
3011
  "width": null
3012
  }
3013
  },
3014
- "0508252a7b894233837b0a7fcb57d151": {
3015
  "model_module": "@jupyter-widgets/controls",
3016
  "model_name": "ProgressStyleModel",
3017
  "model_module_version": "1.5.0",
@@ -3027,7 +3027,7 @@
3027
  "description_width": ""
3028
  }
3029
  },
3030
- "53ef4ff9f2ba4e528e8e59f46b935044": {
3031
  "model_module": "@jupyter-widgets/base",
3032
  "model_name": "LayoutModel",
3033
  "model_module_version": "1.2.0",
@@ -3079,7 +3079,7 @@
3079
  "width": null
3080
  }
3081
  },
3082
- "c44afc7fe718421bbc8617d24c56593c": {
3083
  "model_module": "@jupyter-widgets/controls",
3084
  "model_name": "DescriptionStyleModel",
3085
  "model_module_version": "1.5.0",
@@ -3094,7 +3094,7 @@
3094
  "description_width": ""
3095
  }
3096
  },
3097
- "46453419213a433cb3ed6fe07ba5843d": {
3098
  "model_module": "@jupyter-widgets/controls",
3099
  "model_name": "HBoxModel",
3100
  "model_module_version": "1.5.0",
@@ -3109,14 +3109,14 @@
3109
  "_view_name": "HBoxView",
3110
  "box_style": "",
3111
  "children": [
3112
- "IPY_MODEL_b6d930a1703d4527b2c327cd5e19d676",
3113
- "IPY_MODEL_985ea6752ec84b76853dd5d05d567f82",
3114
- "IPY_MODEL_86316cfe458c46fdbb868fefcec4f4f5"
3115
  ],
3116
- "layout": "IPY_MODEL_9f24ffe2990844b989ed559e74f99054"
3117
  }
3118
  },
3119
- "b6d930a1703d4527b2c327cd5e19d676": {
3120
  "model_module": "@jupyter-widgets/controls",
3121
  "model_name": "HTMLModel",
3122
  "model_module_version": "1.5.0",
@@ -3131,13 +3131,13 @@
3131
  "_view_name": "HTMLView",
3132
  "description": "",
3133
  "description_tooltip": null,
3134
- "layout": "IPY_MODEL_91d368dd1b7b4f0e8c5270e4eb04ac5e",
3135
  "placeholder": "​",
3136
- "style": "IPY_MODEL_d6fbd58fae1b4aa7b93146d787ef7a32",
3137
- "value": "model-00002-of-00003.safetensors:  35%"
3138
  }
3139
  },
3140
- "985ea6752ec84b76853dd5d05d567f82": {
3141
  "model_module": "@jupyter-widgets/controls",
3142
  "model_name": "FloatProgressModel",
3143
  "model_module_version": "1.5.0",
@@ -3150,18 +3150,18 @@
3150
  "_view_module": "@jupyter-widgets/controls",
3151
  "_view_module_version": "1.5.0",
3152
  "_view_name": "ProgressView",
3153
- "bar_style": "",
3154
  "description": "",
3155
  "description_tooltip": null,
3156
- "layout": "IPY_MODEL_bf9a903226cf45d9b28cfd011530b936",
3157
- "max": 4338534096,
3158
  "min": 0,
3159
  "orientation": "horizontal",
3160
- "style": "IPY_MODEL_e15742f1f0444e719d2b5c4f38af5451",
3161
- "value": 1509052439
3162
  }
3163
  },
3164
- "86316cfe458c46fdbb868fefcec4f4f5": {
3165
  "model_module": "@jupyter-widgets/controls",
3166
  "model_name": "HTMLModel",
3167
  "model_module_version": "1.5.0",
@@ -3176,13 +3176,13 @@
3176
  "_view_name": "HTMLView",
3177
  "description": "",
3178
  "description_tooltip": null,
3179
- "layout": "IPY_MODEL_a25e978eb8954cc7a90d98cb5e354e24",
3180
  "placeholder": "​",
3181
- "style": "IPY_MODEL_3ff784a2667f419297fde5e70b6cca5b",
3182
- "value": " 1.51G/4.34G [00:49<00:39, 71.3MB/s]"
3183
  }
3184
  },
3185
- "9f24ffe2990844b989ed559e74f99054": {
3186
  "model_module": "@jupyter-widgets/base",
3187
  "model_name": "LayoutModel",
3188
  "model_module_version": "1.2.0",
@@ -3234,7 +3234,7 @@
3234
  "width": null
3235
  }
3236
  },
3237
- "91d368dd1b7b4f0e8c5270e4eb04ac5e": {
3238
  "model_module": "@jupyter-widgets/base",
3239
  "model_name": "LayoutModel",
3240
  "model_module_version": "1.2.0",
@@ -3286,7 +3286,7 @@
3286
  "width": null
3287
  }
3288
  },
3289
- "d6fbd58fae1b4aa7b93146d787ef7a32": {
3290
  "model_module": "@jupyter-widgets/controls",
3291
  "model_name": "DescriptionStyleModel",
3292
  "model_module_version": "1.5.0",
@@ -3301,7 +3301,7 @@
3301
  "description_width": ""
3302
  }
3303
  },
3304
- "bf9a903226cf45d9b28cfd011530b936": {
3305
  "model_module": "@jupyter-widgets/base",
3306
  "model_name": "LayoutModel",
3307
  "model_module_version": "1.2.0",
@@ -3350,10 +3350,10 @@
3350
  "right": null,
3351
  "top": null,
3352
  "visibility": null,
3353
- "width": null
3354
  }
3355
  },
3356
- "e15742f1f0444e719d2b5c4f38af5451": {
3357
  "model_module": "@jupyter-widgets/controls",
3358
  "model_name": "ProgressStyleModel",
3359
  "model_module_version": "1.5.0",
@@ -3369,7 +3369,7 @@
3369
  "description_width": ""
3370
  }
3371
  },
3372
- "a25e978eb8954cc7a90d98cb5e354e24": {
3373
  "model_module": "@jupyter-widgets/base",
3374
  "model_name": "LayoutModel",
3375
  "model_module_version": "1.2.0",
@@ -3421,7 +3421,7 @@
3421
  "width": null
3422
  }
3423
  },
3424
- "3ff784a2667f419297fde5e70b6cca5b": {
3425
  "model_module": "@jupyter-widgets/controls",
3426
  "model_name": "DescriptionStyleModel",
3427
  "model_module_version": "1.5.0",
@@ -3436,7 +3436,7 @@
3436
  "description_width": ""
3437
  }
3438
  },
3439
- "12d20ba2e2024f69af3b65799894601b": {
3440
  "model_module": "@jupyter-widgets/controls",
3441
  "model_name": "HBoxModel",
3442
  "model_module_version": "1.5.0",
@@ -3451,14 +3451,14 @@
3451
  "_view_name": "HBoxView",
3452
  "box_style": "",
3453
  "children": [
3454
- "IPY_MODEL_0303cb9e444e447d8d03500004ab2718",
3455
- "IPY_MODEL_efefeea7943c43de8e663642df8cf1ac",
3456
- "IPY_MODEL_69945a2d9e054d549de35fcf5caf7c6d"
3457
  ],
3458
- "layout": "IPY_MODEL_126fb6973fea44cda0a9f5cab4744178"
3459
  }
3460
  },
3461
- "0303cb9e444e447d8d03500004ab2718": {
3462
  "model_module": "@jupyter-widgets/controls",
3463
  "model_name": "HTMLModel",
3464
  "model_module_version": "1.5.0",
@@ -3473,13 +3473,13 @@
3473
  "_view_name": "HTMLView",
3474
  "description": "",
3475
  "description_tooltip": null,
3476
- "layout": "IPY_MODEL_7df1bad71f074099bfe79851f64ae2f2",
3477
  "placeholder": "​",
3478
- "style": "IPY_MODEL_da1342b9ae4c44f89a8f776e3695058f",
3479
- "value": "model-00003-of-00003.safetensors:  72%"
3480
  }
3481
  },
3482
- "efefeea7943c43de8e663642df8cf1ac": {
3483
  "model_module": "@jupyter-widgets/controls",
3484
  "model_name": "FloatProgressModel",
3485
  "model_module_version": "1.5.0",
@@ -3492,18 +3492,18 @@
3492
  "_view_module": "@jupyter-widgets/controls",
3493
  "_view_module_version": "1.5.0",
3494
  "_view_name": "ProgressView",
3495
- "bar_style": "",
3496
  "description": "",
3497
  "description_tooltip": null,
3498
- "layout": "IPY_MODEL_0b6b8be2864a459780b865cb2a06db1d",
3499
- "max": 2489319552,
3500
  "min": 0,
3501
  "orientation": "horizontal",
3502
- "style": "IPY_MODEL_423c6c5fbd2f4d46b139251b86a29816",
3503
- "value": 1791035173
3504
  }
3505
  },
3506
- "69945a2d9e054d549de35fcf5caf7c6d": {
3507
  "model_module": "@jupyter-widgets/controls",
3508
  "model_name": "HTMLModel",
3509
  "model_module_version": "1.5.0",
@@ -3518,13 +3518,13 @@
3518
  "_view_name": "HTMLView",
3519
  "description": "",
3520
  "description_tooltip": null,
3521
- "layout": "IPY_MODEL_1f408f5f289e4641891334ca973c8fc7",
3522
  "placeholder": "​",
3523
- "style": "IPY_MODEL_a90e33f62cc54ace808528591952b422",
3524
- "value": " 1.79G/2.49G [01:41<00:45, 15.5MB/s]"
3525
  }
3526
  },
3527
- "126fb6973fea44cda0a9f5cab4744178": {
3528
  "model_module": "@jupyter-widgets/base",
3529
  "model_name": "LayoutModel",
3530
  "model_module_version": "1.2.0",
@@ -3576,7 +3576,7 @@
3576
  "width": null
3577
  }
3578
  },
3579
- "7df1bad71f074099bfe79851f64ae2f2": {
3580
  "model_module": "@jupyter-widgets/base",
3581
  "model_name": "LayoutModel",
3582
  "model_module_version": "1.2.0",
@@ -3628,7 +3628,7 @@
3628
  "width": null
3629
  }
3630
  },
3631
- "da1342b9ae4c44f89a8f776e3695058f": {
3632
  "model_module": "@jupyter-widgets/controls",
3633
  "model_name": "DescriptionStyleModel",
3634
  "model_module_version": "1.5.0",
@@ -3643,7 +3643,7 @@
3643
  "description_width": ""
3644
  }
3645
  },
3646
- "0b6b8be2864a459780b865cb2a06db1d": {
3647
  "model_module": "@jupyter-widgets/base",
3648
  "model_name": "LayoutModel",
3649
  "model_module_version": "1.2.0",
@@ -3692,10 +3692,10 @@
3692
  "right": null,
3693
  "top": null,
3694
  "visibility": null,
3695
- "width": null
3696
  }
3697
  },
3698
- "423c6c5fbd2f4d46b139251b86a29816": {
3699
  "model_module": "@jupyter-widgets/controls",
3700
  "model_name": "ProgressStyleModel",
3701
  "model_module_version": "1.5.0",
@@ -3711,7 +3711,7 @@
3711
  "description_width": ""
3712
  }
3713
  },
3714
- "1f408f5f289e4641891334ca973c8fc7": {
3715
  "model_module": "@jupyter-widgets/base",
3716
  "model_name": "LayoutModel",
3717
  "model_module_version": "1.2.0",
@@ -3763,7 +3763,7 @@
3763
  "width": null
3764
  }
3765
  },
3766
- "a90e33f62cc54ace808528591952b422": {
3767
  "model_module": "@jupyter-widgets/controls",
3768
  "model_name": "DescriptionStyleModel",
3769
  "model_module_version": "1.5.0",
@@ -3778,7 +3778,7 @@
3778
  "description_width": ""
3779
  }
3780
  },
3781
- "c0f9d65172b848e291ea17a1da321f3c": {
3782
  "model_module": "@jupyter-widgets/controls",
3783
  "model_name": "HBoxModel",
3784
  "model_module_version": "1.5.0",
@@ -3793,14 +3793,14 @@
3793
  "_view_name": "HBoxView",
3794
  "box_style": "",
3795
  "children": [
3796
- "IPY_MODEL_b9c367da4a89412391730169acbbdd35",
3797
- "IPY_MODEL_fdc38ba47f7a4d80abc884ca816c363d",
3798
- "IPY_MODEL_523f648751014635b52f2d4336f4f7d6"
3799
  ],
3800
- "layout": "IPY_MODEL_f51bc80160e04634996df2f7c5148c3d"
3801
  }
3802
  },
3803
- "b9c367da4a89412391730169acbbdd35": {
3804
  "model_module": "@jupyter-widgets/controls",
3805
  "model_name": "HTMLModel",
3806
  "model_module_version": "1.5.0",
@@ -3815,13 +3815,13 @@
3815
  "_view_name": "HTMLView",
3816
  "description": "",
3817
  "description_tooltip": null,
3818
- "layout": "IPY_MODEL_34923048e59a4b5aa0743c96493efa51",
3819
  "placeholder": "​",
3820
- "style": "IPY_MODEL_1bdebdcdaf1843e3aac80469c9337a51",
3821
- "value": "model-00001-of-00003.safetensors:  46%"
3822
  }
3823
  },
3824
- "fdc38ba47f7a4d80abc884ca816c363d": {
3825
  "model_module": "@jupyter-widgets/controls",
3826
  "model_name": "FloatProgressModel",
3827
  "model_module_version": "1.5.0",
@@ -3834,18 +3834,18 @@
3834
  "_view_module": "@jupyter-widgets/controls",
3835
  "_view_module_version": "1.5.0",
3836
  "_view_name": "ProgressView",
3837
- "bar_style": "",
3838
  "description": "",
3839
  "description_tooltip": null,
3840
- "layout": "IPY_MODEL_881ffafb32834aeb8bf91870af7c3a42",
3841
- "max": 4999690416,
3842
  "min": 0,
3843
  "orientation": "horizontal",
3844
- "style": "IPY_MODEL_a547f15f1354431c8542fe0d69326dba",
3845
- "value": 2294388491
3846
  }
3847
  },
3848
- "523f648751014635b52f2d4336f4f7d6": {
3849
  "model_module": "@jupyter-widgets/controls",
3850
  "model_name": "HTMLModel",
3851
  "model_module_version": "1.5.0",
@@ -3860,13 +3860,13 @@
3860
  "_view_name": "HTMLView",
3861
  "description": "",
3862
  "description_tooltip": null,
3863
- "layout": "IPY_MODEL_90220217245745bca53a2151e3b1933c",
3864
  "placeholder": "​",
3865
- "style": "IPY_MODEL_2b0d09f6e6b9414c9c0ab489077de0f0",
3866
- "value": " 2.29G/5.00G [01:42<03:07, 14.4MB/s]"
3867
  }
3868
  },
3869
- "f51bc80160e04634996df2f7c5148c3d": {
3870
  "model_module": "@jupyter-widgets/base",
3871
  "model_name": "LayoutModel",
3872
  "model_module_version": "1.2.0",
@@ -3918,7 +3918,7 @@
3918
  "width": null
3919
  }
3920
  },
3921
- "34923048e59a4b5aa0743c96493efa51": {
3922
  "model_module": "@jupyter-widgets/base",
3923
  "model_name": "LayoutModel",
3924
  "model_module_version": "1.2.0",
@@ -3970,7 +3970,7 @@
3970
  "width": null
3971
  }
3972
  },
3973
- "1bdebdcdaf1843e3aac80469c9337a51": {
3974
  "model_module": "@jupyter-widgets/controls",
3975
  "model_name": "DescriptionStyleModel",
3976
  "model_module_version": "1.5.0",
@@ -3985,7 +3985,7 @@
3985
  "description_width": ""
3986
  }
3987
  },
3988
- "881ffafb32834aeb8bf91870af7c3a42": {
3989
  "model_module": "@jupyter-widgets/base",
3990
  "model_name": "LayoutModel",
3991
  "model_module_version": "1.2.0",
@@ -4037,7 +4037,7 @@
4037
  "width": null
4038
  }
4039
  },
4040
- "a547f15f1354431c8542fe0d69326dba": {
4041
  "model_module": "@jupyter-widgets/controls",
4042
  "model_name": "ProgressStyleModel",
4043
  "model_module_version": "1.5.0",
@@ -4053,7 +4053,7 @@
4053
  "description_width": ""
4054
  }
4055
  },
4056
- "90220217245745bca53a2151e3b1933c": {
4057
  "model_module": "@jupyter-widgets/base",
4058
  "model_name": "LayoutModel",
4059
  "model_module_version": "1.2.0",
@@ -4105,7 +4105,7 @@
4105
  "width": null
4106
  }
4107
  },
4108
- "2b0d09f6e6b9414c9c0ab489077de0f0": {
4109
  "model_module": "@jupyter-widgets/controls",
4110
  "model_name": "DescriptionStyleModel",
4111
  "model_module_version": "1.5.0",
@@ -4120,7 +4120,7 @@
4120
  "description_width": ""
4121
  }
4122
  },
4123
- "4b6d4113ffba46d5a7690d762ea224ef": {
4124
  "model_module": "@jupyter-widgets/controls",
4125
  "model_name": "HBoxModel",
4126
  "model_module_version": "1.5.0",
@@ -4135,14 +4135,14 @@
4135
  "_view_name": "HBoxView",
4136
  "box_style": "",
4137
  "children": [
4138
- "IPY_MODEL_9b5ae64e7bc24bd2bbe62c7f224784c7",
4139
- "IPY_MODEL_d38a6f02f4d24f2e81cc6e025b02d87b",
4140
- "IPY_MODEL_3bc56673e3a64423b065f4cb76af047b"
4141
  ],
4142
- "layout": "IPY_MODEL_2e016f49b4844cf7b8d0e832d6ba4f89"
4143
  }
4144
  },
4145
- "9b5ae64e7bc24bd2bbe62c7f224784c7": {
4146
  "model_module": "@jupyter-widgets/controls",
4147
  "model_name": "HTMLModel",
4148
  "model_module_version": "1.5.0",
@@ -4157,13 +4157,13 @@
4157
  "_view_name": "HTMLView",
4158
  "description": "",
4159
  "description_tooltip": null,
4160
- "layout": "IPY_MODEL_16dd315649094a63bfc5853276fe77d4",
4161
  "placeholder": "​",
4162
- "style": "IPY_MODEL_20abd42995f8458d8be78bc79ea33a25",
4163
- "value": "generation_config.json: 100%"
4164
  }
4165
  },
4166
- "d38a6f02f4d24f2e81cc6e025b02d87b": {
4167
  "model_module": "@jupyter-widgets/controls",
4168
  "model_name": "FloatProgressModel",
4169
  "model_module_version": "1.5.0",
@@ -4179,15 +4179,15 @@
4179
  "bar_style": "success",
4180
  "description": "",
4181
  "description_tooltip": null,
4182
- "layout": "IPY_MODEL_d191833b275b404d85ae6930ed2a0f65",
4183
- "max": 213,
4184
  "min": 0,
4185
  "orientation": "horizontal",
4186
- "style": "IPY_MODEL_17013d0d78214f3199cf75c86b25d945",
4187
- "value": 213
4188
  }
4189
  },
4190
- "3bc56673e3a64423b065f4cb76af047b": {
4191
  "model_module": "@jupyter-widgets/controls",
4192
  "model_name": "HTMLModel",
4193
  "model_module_version": "1.5.0",
@@ -4202,13 +4202,13 @@
4202
  "_view_name": "HTMLView",
4203
  "description": "",
4204
  "description_tooltip": null,
4205
- "layout": "IPY_MODEL_5a3b2deebaab4445acd0bd7454d84da9",
4206
  "placeholder": "​",
4207
- "style": "IPY_MODEL_80e6ba82a36744d48d2a966e07fcfa75",
4208
- "value": " 213/213 [00:00<00:00, 12.5kB/s]"
4209
  }
4210
  },
4211
- "2e016f49b4844cf7b8d0e832d6ba4f89": {
4212
  "model_module": "@jupyter-widgets/base",
4213
  "model_name": "LayoutModel",
4214
  "model_module_version": "1.2.0",
@@ -4260,7 +4260,7 @@
4260
  "width": null
4261
  }
4262
  },
4263
- "16dd315649094a63bfc5853276fe77d4": {
4264
  "model_module": "@jupyter-widgets/base",
4265
  "model_name": "LayoutModel",
4266
  "model_module_version": "1.2.0",
@@ -4312,7 +4312,7 @@
4312
  "width": null
4313
  }
4314
  },
4315
- "20abd42995f8458d8be78bc79ea33a25": {
4316
  "model_module": "@jupyter-widgets/controls",
4317
  "model_name": "DescriptionStyleModel",
4318
  "model_module_version": "1.5.0",
@@ -4327,7 +4327,7 @@
4327
  "description_width": ""
4328
  }
4329
  },
4330
- "d191833b275b404d85ae6930ed2a0f65": {
4331
  "model_module": "@jupyter-widgets/base",
4332
  "model_name": "LayoutModel",
4333
  "model_module_version": "1.2.0",
@@ -4379,7 +4379,7 @@
4379
  "width": null
4380
  }
4381
  },
4382
- "17013d0d78214f3199cf75c86b25d945": {
4383
  "model_module": "@jupyter-widgets/controls",
4384
  "model_name": "ProgressStyleModel",
4385
  "model_module_version": "1.5.0",
@@ -4395,7 +4395,7 @@
4395
  "description_width": ""
4396
  }
4397
  },
4398
- "5a3b2deebaab4445acd0bd7454d84da9": {
4399
  "model_module": "@jupyter-widgets/base",
4400
  "model_name": "LayoutModel",
4401
  "model_module_version": "1.2.0",
@@ -4447,7 +4447,7 @@
4447
  "width": null
4448
  }
4449
  },
4450
- "80e6ba82a36744d48d2a966e07fcfa75": {
4451
  "model_module": "@jupyter-widgets/controls",
4452
  "model_name": "DescriptionStyleModel",
4453
  "model_module_version": "1.5.0",
@@ -4462,7 +4462,7 @@
4462
  "description_width": ""
4463
  }
4464
  },
4465
- "0c272deca15c438c95eb50401e2239c2": {
4466
  "model_module": "@jupyter-widgets/controls",
4467
  "model_name": "HBoxModel",
4468
  "model_module_version": "1.5.0",
@@ -4477,14 +4477,14 @@
4477
  "_view_name": "HBoxView",
4478
  "box_style": "",
4479
  "children": [
4480
- "IPY_MODEL_e8bf0dbdd5df42719ebeb649811f9930",
4481
- "IPY_MODEL_99cd2770834e46f69f66d3278d9b68d8",
4482
- "IPY_MODEL_ce59e45e872a4bd38cb4e45e51e22002"
4483
  ],
4484
- "layout": "IPY_MODEL_8bb6af1eecc341c0ac752cb92e9569e0"
4485
  }
4486
  },
4487
- "e8bf0dbdd5df42719ebeb649811f9930": {
4488
  "model_module": "@jupyter-widgets/controls",
4489
  "model_name": "HTMLModel",
4490
  "model_module_version": "1.5.0",
@@ -4499,13 +4499,13 @@
4499
  "_view_name": "HTMLView",
4500
  "description": "",
4501
  "description_tooltip": null,
4502
- "layout": "IPY_MODEL_6eb3710047aa483f8fbf4682ab5567ee",
4503
  "placeholder": "​",
4504
- "style": "IPY_MODEL_b2b6aeb5ed42473db667ee0873ae92c2",
4505
- "value": "config.json: "
4506
  }
4507
  },
4508
- "99cd2770834e46f69f66d3278d9b68d8": {
4509
  "model_module": "@jupyter-widgets/controls",
4510
  "model_name": "FloatProgressModel",
4511
  "model_module_version": "1.5.0",
@@ -4521,15 +4521,15 @@
4521
  "bar_style": "success",
4522
  "description": "",
4523
  "description_tooltip": null,
4524
- "layout": "IPY_MODEL_381951daa8194175aaa1b5ffe848a4dd",
4525
  "max": 1,
4526
  "min": 0,
4527
  "orientation": "horizontal",
4528
- "style": "IPY_MODEL_f4b29be735164ab8ac39979330d0cfa9",
4529
  "value": 1
4530
  }
4531
  },
4532
- "ce59e45e872a4bd38cb4e45e51e22002": {
4533
  "model_module": "@jupyter-widgets/controls",
4534
  "model_name": "HTMLModel",
4535
  "model_module_version": "1.5.0",
@@ -4544,13 +4544,13 @@
4544
  "_view_name": "HTMLView",
4545
  "description": "",
4546
  "description_tooltip": null,
4547
- "layout": "IPY_MODEL_fe16132a615346ada13e1f84a2b2bfb0",
4548
  "placeholder": "​",
4549
- "style": "IPY_MODEL_93eb696a84bc4c7a90262009cc4cec94",
4550
- "value": " 19.3k/? [00:00<00:00, 964kB/s]"
4551
  }
4552
  },
4553
- "8bb6af1eecc341c0ac752cb92e9569e0": {
4554
  "model_module": "@jupyter-widgets/base",
4555
  "model_name": "LayoutModel",
4556
  "model_module_version": "1.2.0",
@@ -4602,7 +4602,7 @@
4602
  "width": null
4603
  }
4604
  },
4605
- "6eb3710047aa483f8fbf4682ab5567ee": {
4606
  "model_module": "@jupyter-widgets/base",
4607
  "model_name": "LayoutModel",
4608
  "model_module_version": "1.2.0",
@@ -4654,7 +4654,7 @@
4654
  "width": null
4655
  }
4656
  },
4657
- "b2b6aeb5ed42473db667ee0873ae92c2": {
4658
  "model_module": "@jupyter-widgets/controls",
4659
  "model_name": "DescriptionStyleModel",
4660
  "model_module_version": "1.5.0",
@@ -4669,7 +4669,7 @@
4669
  "description_width": ""
4670
  }
4671
  },
4672
- "381951daa8194175aaa1b5ffe848a4dd": {
4673
  "model_module": "@jupyter-widgets/base",
4674
  "model_name": "LayoutModel",
4675
  "model_module_version": "1.2.0",
@@ -4721,7 +4721,7 @@
4721
  "width": "20px"
4722
  }
4723
  },
4724
- "f4b29be735164ab8ac39979330d0cfa9": {
4725
  "model_module": "@jupyter-widgets/controls",
4726
  "model_name": "ProgressStyleModel",
4727
  "model_module_version": "1.5.0",
@@ -4737,7 +4737,7 @@
4737
  "description_width": ""
4738
  }
4739
  },
4740
- "fe16132a615346ada13e1f84a2b2bfb0": {
4741
  "model_module": "@jupyter-widgets/base",
4742
  "model_name": "LayoutModel",
4743
  "model_module_version": "1.2.0",
@@ -4789,7 +4789,7 @@
4789
  "width": null
4790
  }
4791
  },
4792
- "93eb696a84bc4c7a90262009cc4cec94": {
4793
  "model_module": "@jupyter-widgets/controls",
4794
  "model_name": "DescriptionStyleModel",
4795
  "model_module_version": "1.5.0",
@@ -4804,7 +4804,7 @@
4804
  "description_width": ""
4805
  }
4806
  },
4807
- "5abd62c5fdfd41a89c1d7e4533dd7c17": {
4808
  "model_module": "@jupyter-widgets/controls",
4809
  "model_name": "HBoxModel",
4810
  "model_module_version": "1.5.0",
@@ -4819,14 +4819,14 @@
4819
  "_view_name": "HBoxView",
4820
  "box_style": "",
4821
  "children": [
4822
- "IPY_MODEL_a11ea11d184f4ce4868d7f70cc4f70ef",
4823
- "IPY_MODEL_30d9459dc22f477b8737984247a6aba7",
4824
- "IPY_MODEL_9af022bc36e547e6bcf12f7ff7752eef"
4825
  ],
4826
- "layout": "IPY_MODEL_6e24f7d587164e88a47cee2e22586832"
4827
  }
4828
  },
4829
- "a11ea11d184f4ce4868d7f70cc4f70ef": {
4830
  "model_module": "@jupyter-widgets/controls",
4831
  "model_name": "HTMLModel",
4832
  "model_module_version": "1.5.0",
@@ -4841,13 +4841,13 @@
4841
  "_view_name": "HTMLView",
4842
  "description": "",
4843
  "description_tooltip": null,
4844
- "layout": "IPY_MODEL_7532d4f9593e4cf7841bcc62c38fef30",
4845
  "placeholder": "​",
4846
- "style": "IPY_MODEL_08407812e0e8454fa0f9f0bf3e8b6628",
4847
- "value": ".gitattributes: 100%"
4848
  }
4849
  },
4850
- "30d9459dc22f477b8737984247a6aba7": {
4851
  "model_module": "@jupyter-widgets/controls",
4852
  "model_name": "FloatProgressModel",
4853
  "model_module_version": "1.5.0",
@@ -4863,15 +4863,15 @@
4863
  "bar_style": "success",
4864
  "description": "",
4865
  "description_tooltip": null,
4866
- "layout": "IPY_MODEL_136f18d8324f4d9bbae7986eee95202f",
4867
- "max": 278,
4868
  "min": 0,
4869
  "orientation": "horizontal",
4870
- "style": "IPY_MODEL_419facde9a2848048feafa9f32db4a84",
4871
- "value": 278
4872
  }
4873
  },
4874
- "9af022bc36e547e6bcf12f7ff7752eef": {
4875
  "model_module": "@jupyter-widgets/controls",
4876
  "model_name": "HTMLModel",
4877
  "model_module_version": "1.5.0",
@@ -4886,13 +4886,13 @@
4886
  "_view_name": "HTMLView",
4887
  "description": "",
4888
  "description_tooltip": null,
4889
- "layout": "IPY_MODEL_c9a9ae53c44b40d5aa0b3314c78a3cd7",
4890
  "placeholder": "​",
4891
- "style": "IPY_MODEL_8995b5a8487746b9b2457cdf1dbaf910",
4892
- "value": " 278/278 [00:00<00:00, 18.4kB/s]"
4893
  }
4894
  },
4895
- "6e24f7d587164e88a47cee2e22586832": {
4896
  "model_module": "@jupyter-widgets/base",
4897
  "model_name": "LayoutModel",
4898
  "model_module_version": "1.2.0",
@@ -4944,7 +4944,7 @@
4944
  "width": null
4945
  }
4946
  },
4947
- "7532d4f9593e4cf7841bcc62c38fef30": {
4948
  "model_module": "@jupyter-widgets/base",
4949
  "model_name": "LayoutModel",
4950
  "model_module_version": "1.2.0",
@@ -4996,7 +4996,7 @@
4996
  "width": null
4997
  }
4998
  },
4999
- "08407812e0e8454fa0f9f0bf3e8b6628": {
5000
  "model_module": "@jupyter-widgets/controls",
5001
  "model_name": "DescriptionStyleModel",
5002
  "model_module_version": "1.5.0",
@@ -5011,7 +5011,7 @@
5011
  "description_width": ""
5012
  }
5013
  },
5014
- "136f18d8324f4d9bbae7986eee95202f": {
5015
  "model_module": "@jupyter-widgets/base",
5016
  "model_name": "LayoutModel",
5017
  "model_module_version": "1.2.0",
@@ -5060,10 +5060,10 @@
5060
  "right": null,
5061
  "top": null,
5062
  "visibility": null,
5063
- "width": null
5064
  }
5065
  },
5066
- "419facde9a2848048feafa9f32db4a84": {
5067
  "model_module": "@jupyter-widgets/controls",
5068
  "model_name": "ProgressStyleModel",
5069
  "model_module_version": "1.5.0",
@@ -5079,7 +5079,7 @@
5079
  "description_width": ""
5080
  }
5081
  },
5082
- "c9a9ae53c44b40d5aa0b3314c78a3cd7": {
5083
  "model_module": "@jupyter-widgets/base",
5084
  "model_name": "LayoutModel",
5085
  "model_module_version": "1.2.0",
@@ -5131,7 +5131,7 @@
5131
  "width": null
5132
  }
5133
  },
5134
- "8995b5a8487746b9b2457cdf1dbaf910": {
5135
  "model_module": "@jupyter-widgets/controls",
5136
  "model_name": "DescriptionStyleModel",
5137
  "model_module_version": "1.5.0",
@@ -5146,7 +5146,7 @@
5146
  "description_width": ""
5147
  }
5148
  },
5149
- "8f11f5be18a04a41a4fdd5f290e430e0": {
5150
  "model_module": "@jupyter-widgets/controls",
5151
  "model_name": "HBoxModel",
5152
  "model_module_version": "1.5.0",
@@ -5161,14 +5161,14 @@
5161
  "_view_name": "HBoxView",
5162
  "box_style": "",
5163
  "children": [
5164
- "IPY_MODEL_437736605824435a9d941aa03c9bd510",
5165
- "IPY_MODEL_311324bf2d23469bb795009d01dfde46",
5166
- "IPY_MODEL_be2bebff25cf4773b527ae3d631cf855"
5167
  ],
5168
- "layout": "IPY_MODEL_5fef1b13a66a4301bb6371574abe851e"
5169
  }
5170
  },
5171
- "437736605824435a9d941aa03c9bd510": {
5172
  "model_module": "@jupyter-widgets/controls",
5173
  "model_name": "HTMLModel",
5174
  "model_module_version": "1.5.0",
@@ -5183,13 +5183,13 @@
5183
  "_view_name": "HTMLView",
5184
  "description": "",
5185
  "description_tooltip": null,
5186
- "layout": "IPY_MODEL_879981a5f9a24ba4bd0fcd77880bcbb3",
5187
  "placeholder": "​",
5188
- "style": "IPY_MODEL_4d517d9a3c60491bbfec3d1315d554ce",
5189
- "value": "model.safetensors.index.json: "
5190
  }
5191
  },
5192
- "311324bf2d23469bb795009d01dfde46": {
5193
  "model_module": "@jupyter-widgets/controls",
5194
  "model_name": "FloatProgressModel",
5195
  "model_module_version": "1.5.0",
@@ -5205,15 +5205,15 @@
5205
  "bar_style": "success",
5206
  "description": "",
5207
  "description_tooltip": null,
5208
- "layout": "IPY_MODEL_7797e48ca26643d7b6cccac9bd7139cc",
5209
  "max": 1,
5210
  "min": 0,
5211
  "orientation": "horizontal",
5212
- "style": "IPY_MODEL_d4323c672ccb49faa5f99337f2734c8c",
5213
  "value": 1
5214
  }
5215
  },
5216
- "be2bebff25cf4773b527ae3d631cf855": {
5217
  "model_module": "@jupyter-widgets/controls",
5218
  "model_name": "HTMLModel",
5219
  "model_module_version": "1.5.0",
@@ -5228,13 +5228,13 @@
5228
  "_view_name": "HTMLView",
5229
  "description": "",
5230
  "description_tooltip": null,
5231
- "layout": "IPY_MODEL_52eeda864e2443aebaab8947d0b5164c",
5232
  "placeholder": "​",
5233
- "style": "IPY_MODEL_40d80a9dda8340dea973269cc765c612",
5234
- "value": " 163k/? [00:00<00:00, 5.37MB/s]"
5235
  }
5236
  },
5237
- "5fef1b13a66a4301bb6371574abe851e": {
5238
  "model_module": "@jupyter-widgets/base",
5239
  "model_name": "LayoutModel",
5240
  "model_module_version": "1.2.0",
@@ -5286,7 +5286,7 @@
5286
  "width": null
5287
  }
5288
  },
5289
- "879981a5f9a24ba4bd0fcd77880bcbb3": {
5290
  "model_module": "@jupyter-widgets/base",
5291
  "model_name": "LayoutModel",
5292
  "model_module_version": "1.2.0",
@@ -5338,7 +5338,7 @@
5338
  "width": null
5339
  }
5340
  },
5341
- "4d517d9a3c60491bbfec3d1315d554ce": {
5342
  "model_module": "@jupyter-widgets/controls",
5343
  "model_name": "DescriptionStyleModel",
5344
  "model_module_version": "1.5.0",
@@ -5353,7 +5353,7 @@
5353
  "description_width": ""
5354
  }
5355
  },
5356
- "7797e48ca26643d7b6cccac9bd7139cc": {
5357
  "model_module": "@jupyter-widgets/base",
5358
  "model_name": "LayoutModel",
5359
  "model_module_version": "1.2.0",
@@ -5405,7 +5405,349 @@
5405
  "width": "20px"
5406
  }
5407
  },
5408
- "d4323c672ccb49faa5f99337f2734c8c": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5409
  "model_module": "@jupyter-widgets/controls",
5410
  "model_name": "ProgressStyleModel",
5411
  "model_module_version": "1.5.0",
@@ -5421,7 +5763,7 @@
5421
  "description_width": ""
5422
  }
5423
  },
5424
- "52eeda864e2443aebaab8947d0b5164c": {
5425
  "model_module": "@jupyter-widgets/base",
5426
  "model_name": "LayoutModel",
5427
  "model_module_version": "1.2.0",
@@ -5473,7 +5815,7 @@
5473
  "width": null
5474
  }
5475
  },
5476
- "40d80a9dda8340dea973269cc765c612": {
5477
  "model_module": "@jupyter-widgets/controls",
5478
  "model_name": "DescriptionStyleModel",
5479
  "model_module_version": "1.5.0",
@@ -6327,100 +6669,111 @@
6327
  "metadata": {
6328
  "colab": {
6329
  "base_uri": "https://localhost:8080/",
6330
- "height": 290,
6331
  "referenced_widgets": [
6332
- "db161b32e9274be58b559b187b6d292a",
6333
- "f7b656d8f6db48a4b2186383cbc84b29",
6334
- "4e828087d74f430ab772b462790a8903",
6335
- "53631f8fedcd4c5b8a4f5dc5768292c5",
6336
- "b8e2f351331041f6bab1eeacf953a2b0",
6337
- "3cbf7135fc77424aaa12cb2c5be57743",
6338
- "a2d41db1f50f4714bbe2a058b7edccaf",
6339
- "a49f9939455349dda171ba76ac1fa329",
6340
- "0508252a7b894233837b0a7fcb57d151",
6341
- "53ef4ff9f2ba4e528e8e59f46b935044",
6342
- "c44afc7fe718421bbc8617d24c56593c",
6343
- "46453419213a433cb3ed6fe07ba5843d",
6344
- "b6d930a1703d4527b2c327cd5e19d676",
6345
- "985ea6752ec84b76853dd5d05d567f82",
6346
- "86316cfe458c46fdbb868fefcec4f4f5",
6347
- "9f24ffe2990844b989ed559e74f99054",
6348
- "91d368dd1b7b4f0e8c5270e4eb04ac5e",
6349
- "d6fbd58fae1b4aa7b93146d787ef7a32",
6350
- "bf9a903226cf45d9b28cfd011530b936",
6351
- "e15742f1f0444e719d2b5c4f38af5451",
6352
- "a25e978eb8954cc7a90d98cb5e354e24",
6353
- "3ff784a2667f419297fde5e70b6cca5b",
6354
- "12d20ba2e2024f69af3b65799894601b",
6355
- "0303cb9e444e447d8d03500004ab2718",
6356
- "efefeea7943c43de8e663642df8cf1ac",
6357
- "69945a2d9e054d549de35fcf5caf7c6d",
6358
- "126fb6973fea44cda0a9f5cab4744178",
6359
- "7df1bad71f074099bfe79851f64ae2f2",
6360
- "da1342b9ae4c44f89a8f776e3695058f",
6361
- "0b6b8be2864a459780b865cb2a06db1d",
6362
- "423c6c5fbd2f4d46b139251b86a29816",
6363
- "1f408f5f289e4641891334ca973c8fc7",
6364
- "a90e33f62cc54ace808528591952b422",
6365
- "c0f9d65172b848e291ea17a1da321f3c",
6366
- "b9c367da4a89412391730169acbbdd35",
6367
- "fdc38ba47f7a4d80abc884ca816c363d",
6368
- "523f648751014635b52f2d4336f4f7d6",
6369
- "f51bc80160e04634996df2f7c5148c3d",
6370
- "34923048e59a4b5aa0743c96493efa51",
6371
- "1bdebdcdaf1843e3aac80469c9337a51",
6372
- "881ffafb32834aeb8bf91870af7c3a42",
6373
- "a547f15f1354431c8542fe0d69326dba",
6374
- "90220217245745bca53a2151e3b1933c",
6375
- "2b0d09f6e6b9414c9c0ab489077de0f0",
6376
- "4b6d4113ffba46d5a7690d762ea224ef",
6377
- "9b5ae64e7bc24bd2bbe62c7f224784c7",
6378
- "d38a6f02f4d24f2e81cc6e025b02d87b",
6379
- "3bc56673e3a64423b065f4cb76af047b",
6380
- "2e016f49b4844cf7b8d0e832d6ba4f89",
6381
- "16dd315649094a63bfc5853276fe77d4",
6382
- "20abd42995f8458d8be78bc79ea33a25",
6383
- "d191833b275b404d85ae6930ed2a0f65",
6384
- "17013d0d78214f3199cf75c86b25d945",
6385
- "5a3b2deebaab4445acd0bd7454d84da9",
6386
- "80e6ba82a36744d48d2a966e07fcfa75",
6387
- "0c272deca15c438c95eb50401e2239c2",
6388
- "e8bf0dbdd5df42719ebeb649811f9930",
6389
- "99cd2770834e46f69f66d3278d9b68d8",
6390
- "ce59e45e872a4bd38cb4e45e51e22002",
6391
- "8bb6af1eecc341c0ac752cb92e9569e0",
6392
- "6eb3710047aa483f8fbf4682ab5567ee",
6393
- "b2b6aeb5ed42473db667ee0873ae92c2",
6394
- "381951daa8194175aaa1b5ffe848a4dd",
6395
- "f4b29be735164ab8ac39979330d0cfa9",
6396
- "fe16132a615346ada13e1f84a2b2bfb0",
6397
- "93eb696a84bc4c7a90262009cc4cec94",
6398
- "5abd62c5fdfd41a89c1d7e4533dd7c17",
6399
- "a11ea11d184f4ce4868d7f70cc4f70ef",
6400
- "30d9459dc22f477b8737984247a6aba7",
6401
- "9af022bc36e547e6bcf12f7ff7752eef",
6402
- "6e24f7d587164e88a47cee2e22586832",
6403
- "7532d4f9593e4cf7841bcc62c38fef30",
6404
- "08407812e0e8454fa0f9f0bf3e8b6628",
6405
- "136f18d8324f4d9bbae7986eee95202f",
6406
- "419facde9a2848048feafa9f32db4a84",
6407
- "c9a9ae53c44b40d5aa0b3314c78a3cd7",
6408
- "8995b5a8487746b9b2457cdf1dbaf910",
6409
- "8f11f5be18a04a41a4fdd5f290e430e0",
6410
- "437736605824435a9d941aa03c9bd510",
6411
- "311324bf2d23469bb795009d01dfde46",
6412
- "be2bebff25cf4773b527ae3d631cf855",
6413
- "5fef1b13a66a4301bb6371574abe851e",
6414
- "879981a5f9a24ba4bd0fcd77880bcbb3",
6415
- "4d517d9a3c60491bbfec3d1315d554ce",
6416
- "7797e48ca26643d7b6cccac9bd7139cc",
6417
- "d4323c672ccb49faa5f99337f2734c8c",
6418
- "52eeda864e2443aebaab8947d0b5164c",
6419
- "40d80a9dda8340dea973269cc765c612"
 
 
 
 
 
 
 
 
 
 
 
6420
  ]
6421
  },
6422
  "id": "d97388b1",
6423
- "outputId": "e7398874-c06f-48cb-9a5b-bcf575c52ead"
6424
  },
6425
  "source": [
6426
  "from huggingface_hub import snapshot_download\n",
@@ -6457,7 +6810,7 @@
6457
  "print(f\"SDNQ Model device: {next(sdnq_model.parameters()).device}\")\n",
6458
  "print(f\"SDNQ Model dtype: {next(sdnq_model.parameters()).dtype}\")"
6459
  ],
6460
- "execution_count": null,
6461
  "outputs": [
6462
  {
6463
  "output_type": "stream",
@@ -6470,12 +6823,26 @@
6470
  "output_type": "display_data",
6471
  "data": {
6472
  "text/plain": [
6473
- "Fetching 7 files: 0%| | 0/7 [00:00<?, ?it/s]"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6474
  ],
6475
  "application/vnd.jupyter.widget-view+json": {
6476
  "version_major": 2,
6477
  "version_minor": 0,
6478
- "model_id": "db161b32e9274be58b559b187b6d292a"
6479
  }
6480
  },
6481
  "metadata": {}
@@ -6484,12 +6851,12 @@
6484
  "output_type": "display_data",
6485
  "data": {
6486
  "text/plain": [
6487
- "model-00002-of-00003.safetensors: 0%| | 0.00/4.34G [00:00<?, ?B/s]"
6488
  ],
6489
  "application/vnd.jupyter.widget-view+json": {
6490
  "version_major": 2,
6491
  "version_minor": 0,
6492
- "model_id": "46453419213a433cb3ed6fe07ba5843d"
6493
  }
6494
  },
6495
  "metadata": {}
@@ -6498,12 +6865,12 @@
6498
  "output_type": "display_data",
6499
  "data": {
6500
  "text/plain": [
6501
- "model-00003-of-00003.safetensors: 0%| | 0.00/2.49G [00:00<?, ?B/s]"
6502
  ],
6503
  "application/vnd.jupyter.widget-view+json": {
6504
  "version_major": 2,
6505
  "version_minor": 0,
6506
- "model_id": "12d20ba2e2024f69af3b65799894601b"
6507
  }
6508
  },
6509
  "metadata": {}
@@ -6512,12 +6879,12 @@
6512
  "output_type": "display_data",
6513
  "data": {
6514
  "text/plain": [
6515
- "model-00001-of-00003.safetensors: 0%| | 0.00/5.00G [00:00<?, ?B/s]"
6516
  ],
6517
  "application/vnd.jupyter.widget-view+json": {
6518
  "version_major": 2,
6519
  "version_minor": 0,
6520
- "model_id": "c0f9d65172b848e291ea17a1da321f3c"
6521
  }
6522
  },
6523
  "metadata": {}
@@ -6526,12 +6893,12 @@
6526
  "output_type": "display_data",
6527
  "data": {
6528
  "text/plain": [
6529
- "generation_config.json: 0%| | 0.00/213 [00:00<?, ?B/s]"
6530
  ],
6531
  "application/vnd.jupyter.widget-view+json": {
6532
  "version_major": 2,
6533
  "version_minor": 0,
6534
- "model_id": "4b6d4113ffba46d5a7690d762ea224ef"
6535
  }
6536
  },
6537
  "metadata": {}
@@ -6540,12 +6907,12 @@
6540
  "output_type": "display_data",
6541
  "data": {
6542
  "text/plain": [
6543
- "config.json: 0.00B [00:00, ?B/s]"
6544
  ],
6545
  "application/vnd.jupyter.widget-view+json": {
6546
  "version_major": 2,
6547
  "version_minor": 0,
6548
- "model_id": "0c272deca15c438c95eb50401e2239c2"
6549
  }
6550
  },
6551
  "metadata": {}
@@ -6554,29 +6921,71 @@
6554
  "output_type": "display_data",
6555
  "data": {
6556
  "text/plain": [
6557
- ".gitattributes: 0%| | 0.00/278 [00:00<?, ?B/s]"
6558
  ],
6559
  "application/vnd.jupyter.widget-view+json": {
6560
  "version_major": 2,
6561
  "version_minor": 0,
6562
- "model_id": "5abd62c5fdfd41a89c1d7e4533dd7c17"
6563
  }
6564
  },
6565
  "metadata": {}
6566
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6567
  {
6568
  "output_type": "display_data",
6569
  "data": {
6570
  "text/plain": [
6571
- "model.safetensors.index.json: 0.00B [00:00, ?B/s]"
6572
  ],
6573
  "application/vnd.jupyter.widget-view+json": {
6574
  "version_major": 2,
6575
  "version_minor": 0,
6576
- "model_id": "8f11f5be18a04a41a4fdd5f290e430e0"
6577
  }
6578
  },
6579
  "metadata": {}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6580
  }
6581
  ]
6582
  },
 
2752
  "description_width": ""
2753
  }
2754
  },
2755
+ "b2d96c62ece74d10ae8cfa0368bdef5d": {
2756
  "model_module": "@jupyter-widgets/controls",
2757
  "model_name": "HBoxModel",
2758
  "model_module_version": "1.5.0",
 
2767
  "_view_name": "HBoxView",
2768
  "box_style": "",
2769
  "children": [
2770
+ "IPY_MODEL_026549e161b746819e82057daa34d013",
2771
+ "IPY_MODEL_5e7403e444914be28ff4dffea6b0e223",
2772
+ "IPY_MODEL_8a47ce5909fa46ab96d5b289c35cb3c2"
2773
  ],
2774
+ "layout": "IPY_MODEL_dcb0c08779074052a98d87804be0ffbc"
2775
  }
2776
  },
2777
+ "026549e161b746819e82057daa34d013": {
2778
  "model_module": "@jupyter-widgets/controls",
2779
  "model_name": "HTMLModel",
2780
  "model_module_version": "1.5.0",
 
2789
  "_view_name": "HTMLView",
2790
  "description": "",
2791
  "description_tooltip": null,
2792
+ "layout": "IPY_MODEL_e02027bec5214982b5c51a556935799e",
2793
  "placeholder": "​",
2794
+ "style": "IPY_MODEL_2d46faefa76e4f03903d970edcab8e6b",
2795
+ "value": "Fetching 17 files: 100%"
2796
  }
2797
  },
2798
+ "5e7403e444914be28ff4dffea6b0e223": {
2799
  "model_module": "@jupyter-widgets/controls",
2800
  "model_name": "FloatProgressModel",
2801
  "model_module_version": "1.5.0",
 
2808
  "_view_module": "@jupyter-widgets/controls",
2809
  "_view_module_version": "1.5.0",
2810
  "_view_name": "ProgressView",
2811
+ "bar_style": "success",
2812
  "description": "",
2813
  "description_tooltip": null,
2814
+ "layout": "IPY_MODEL_252ee04b367841778ae4c89a84c5f1de",
2815
+ "max": 17,
2816
  "min": 0,
2817
  "orientation": "horizontal",
2818
+ "style": "IPY_MODEL_ad5d4df02464404d80de57028d815692",
2819
+ "value": 17
2820
  }
2821
  },
2822
+ "8a47ce5909fa46ab96d5b289c35cb3c2": {
2823
  "model_module": "@jupyter-widgets/controls",
2824
  "model_name": "HTMLModel",
2825
  "model_module_version": "1.5.0",
 
2834
  "_view_name": "HTMLView",
2835
  "description": "",
2836
  "description_tooltip": null,
2837
+ "layout": "IPY_MODEL_c7b6596488a04171b96271bb41a918ca",
2838
  "placeholder": "​",
2839
+ "style": "IPY_MODEL_dce80ab74a6d41afbeb65708f855edb5",
2840
+ "value": " 17/17 [00:01&lt;00:00,  7.95it/s]"
2841
  }
2842
  },
2843
+ "dcb0c08779074052a98d87804be0ffbc": {
2844
  "model_module": "@jupyter-widgets/base",
2845
  "model_name": "LayoutModel",
2846
  "model_module_version": "1.2.0",
 
2892
  "width": null
2893
  }
2894
  },
2895
+ "e02027bec5214982b5c51a556935799e": {
2896
  "model_module": "@jupyter-widgets/base",
2897
  "model_name": "LayoutModel",
2898
  "model_module_version": "1.2.0",
 
2944
  "width": null
2945
  }
2946
  },
2947
+ "2d46faefa76e4f03903d970edcab8e6b": {
2948
  "model_module": "@jupyter-widgets/controls",
2949
  "model_name": "DescriptionStyleModel",
2950
  "model_module_version": "1.5.0",
 
2959
  "description_width": ""
2960
  }
2961
  },
2962
+ "252ee04b367841778ae4c89a84c5f1de": {
2963
  "model_module": "@jupyter-widgets/base",
2964
  "model_name": "LayoutModel",
2965
  "model_module_version": "1.2.0",
 
3011
  "width": null
3012
  }
3013
  },
3014
+ "ad5d4df02464404d80de57028d815692": {
3015
  "model_module": "@jupyter-widgets/controls",
3016
  "model_name": "ProgressStyleModel",
3017
  "model_module_version": "1.5.0",
 
3027
  "description_width": ""
3028
  }
3029
  },
3030
+ "c7b6596488a04171b96271bb41a918ca": {
3031
  "model_module": "@jupyter-widgets/base",
3032
  "model_name": "LayoutModel",
3033
  "model_module_version": "1.2.0",
 
3079
  "width": null
3080
  }
3081
  },
3082
+ "dce80ab74a6d41afbeb65708f855edb5": {
3083
  "model_module": "@jupyter-widgets/controls",
3084
  "model_name": "DescriptionStyleModel",
3085
  "model_module_version": "1.5.0",
 
3094
  "description_width": ""
3095
  }
3096
  },
3097
+ "2bc646b6c1224558b1513c2e8d3aeec4": {
3098
  "model_module": "@jupyter-widgets/controls",
3099
  "model_name": "HBoxModel",
3100
  "model_module_version": "1.5.0",
 
3109
  "_view_name": "HBoxView",
3110
  "box_style": "",
3111
  "children": [
3112
+ "IPY_MODEL_5eae870a01094dc2a79a1e9580ecd0e3",
3113
+ "IPY_MODEL_aae3998d02b542349a0d63efdc796f5f",
3114
+ "IPY_MODEL_db3eb513d928461cb9f29c7a81a70eef"
3115
  ],
3116
+ "layout": "IPY_MODEL_6b9b92000d0243669e0b4488aa490109"
3117
  }
3118
  },
3119
+ "5eae870a01094dc2a79a1e9580ecd0e3": {
3120
  "model_module": "@jupyter-widgets/controls",
3121
  "model_name": "HTMLModel",
3122
  "model_module_version": "1.5.0",
 
3131
  "_view_name": "HTMLView",
3132
  "description": "",
3133
  "description_tooltip": null,
3134
+ "layout": "IPY_MODEL_1a24e8e6ef0c4181831de003c8576d88",
3135
  "placeholder": "​",
3136
+ "style": "IPY_MODEL_66d73112d71d441f9b87cac7169491f8",
3137
+ "value": "chat_template.json:"
3138
  }
3139
  },
3140
+ "aae3998d02b542349a0d63efdc796f5f": {
3141
  "model_module": "@jupyter-widgets/controls",
3142
  "model_name": "FloatProgressModel",
3143
  "model_module_version": "1.5.0",
 
3150
  "_view_module": "@jupyter-widgets/controls",
3151
  "_view_module_version": "1.5.0",
3152
  "_view_name": "ProgressView",
3153
+ "bar_style": "success",
3154
  "description": "",
3155
  "description_tooltip": null,
3156
+ "layout": "IPY_MODEL_8b46745fb1764422869c83b231197585",
3157
+ "max": 1,
3158
  "min": 0,
3159
  "orientation": "horizontal",
3160
+ "style": "IPY_MODEL_05b38f4f3a97411495f7678a938fd371",
3161
+ "value": 1
3162
  }
3163
  },
3164
+ "db3eb513d928461cb9f29c7a81a70eef": {
3165
  "model_module": "@jupyter-widgets/controls",
3166
  "model_name": "HTMLModel",
3167
  "model_module_version": "1.5.0",
 
3176
  "_view_name": "HTMLView",
3177
  "description": "",
3178
  "description_tooltip": null,
3179
+ "layout": "IPY_MODEL_f0942e71542048a49ee438966bac45ac",
3180
  "placeholder": "​",
3181
+ "style": "IPY_MODEL_ae73e40ccac5442494b570893f5e1d23",
3182
+ "value": " 5.50k/? [00:00&lt;00:00, 144kB/s]"
3183
  }
3184
  },
3185
+ "6b9b92000d0243669e0b4488aa490109": {
3186
  "model_module": "@jupyter-widgets/base",
3187
  "model_name": "LayoutModel",
3188
  "model_module_version": "1.2.0",
 
3234
  "width": null
3235
  }
3236
  },
3237
+ "1a24e8e6ef0c4181831de003c8576d88": {
3238
  "model_module": "@jupyter-widgets/base",
3239
  "model_name": "LayoutModel",
3240
  "model_module_version": "1.2.0",
 
3286
  "width": null
3287
  }
3288
  },
3289
+ "66d73112d71d441f9b87cac7169491f8": {
3290
  "model_module": "@jupyter-widgets/controls",
3291
  "model_name": "DescriptionStyleModel",
3292
  "model_module_version": "1.5.0",
 
3301
  "description_width": ""
3302
  }
3303
  },
3304
+ "8b46745fb1764422869c83b231197585": {
3305
  "model_module": "@jupyter-widgets/base",
3306
  "model_name": "LayoutModel",
3307
  "model_module_version": "1.2.0",
 
3350
  "right": null,
3351
  "top": null,
3352
  "visibility": null,
3353
+ "width": "20px"
3354
  }
3355
  },
3356
+ "05b38f4f3a97411495f7678a938fd371": {
3357
  "model_module": "@jupyter-widgets/controls",
3358
  "model_name": "ProgressStyleModel",
3359
  "model_module_version": "1.5.0",
 
3369
  "description_width": ""
3370
  }
3371
  },
3372
+ "f0942e71542048a49ee438966bac45ac": {
3373
  "model_module": "@jupyter-widgets/base",
3374
  "model_name": "LayoutModel",
3375
  "model_module_version": "1.2.0",
 
3421
  "width": null
3422
  }
3423
  },
3424
+ "ae73e40ccac5442494b570893f5e1d23": {
3425
  "model_module": "@jupyter-widgets/controls",
3426
  "model_name": "DescriptionStyleModel",
3427
  "model_module_version": "1.5.0",
 
3436
  "description_width": ""
3437
  }
3438
  },
3439
+ "8c53093a52d249a4b10e8dad950aef62": {
3440
  "model_module": "@jupyter-widgets/controls",
3441
  "model_name": "HBoxModel",
3442
  "model_module_version": "1.5.0",
 
3451
  "_view_name": "HBoxView",
3452
  "box_style": "",
3453
  "children": [
3454
+ "IPY_MODEL_24d3d9a8ea6a4303be819fde09d698e6",
3455
+ "IPY_MODEL_804b4627bb59452b8d97a304a0beaa99",
3456
+ "IPY_MODEL_12cd9edc9fd844d09a20bd61e359da61"
3457
  ],
3458
+ "layout": "IPY_MODEL_410df68c5f5a48c8b5d7a6d7f0f3f0ee"
3459
  }
3460
  },
3461
+ "24d3d9a8ea6a4303be819fde09d698e6": {
3462
  "model_module": "@jupyter-widgets/controls",
3463
  "model_name": "HTMLModel",
3464
  "model_module_version": "1.5.0",
 
3473
  "_view_name": "HTMLView",
3474
  "description": "",
3475
  "description_tooltip": null,
3476
+ "layout": "IPY_MODEL_3b0bd0450cf440819aa6b56243d86719",
3477
  "placeholder": "​",
3478
+ "style": "IPY_MODEL_bafb910ffc8542e0a4a82ac2c5541b0b",
3479
+ "value": "merges.txt:"
3480
  }
3481
  },
3482
+ "804b4627bb59452b8d97a304a0beaa99": {
3483
  "model_module": "@jupyter-widgets/controls",
3484
  "model_name": "FloatProgressModel",
3485
  "model_module_version": "1.5.0",
 
3492
  "_view_module": "@jupyter-widgets/controls",
3493
  "_view_module_version": "1.5.0",
3494
  "_view_name": "ProgressView",
3495
+ "bar_style": "success",
3496
  "description": "",
3497
  "description_tooltip": null,
3498
+ "layout": "IPY_MODEL_654e38a251db4c54a0cab8358e08ae54",
3499
+ "max": 1,
3500
  "min": 0,
3501
  "orientation": "horizontal",
3502
+ "style": "IPY_MODEL_8193406afd25421b8d7125a3d694f7ee",
3503
+ "value": 1
3504
  }
3505
  },
3506
+ "12cd9edc9fd844d09a20bd61e359da61": {
3507
  "model_module": "@jupyter-widgets/controls",
3508
  "model_name": "HTMLModel",
3509
  "model_module_version": "1.5.0",
 
3518
  "_view_name": "HTMLView",
3519
  "description": "",
3520
  "description_tooltip": null,
3521
+ "layout": "IPY_MODEL_ca7a2197dff34c8696f38de9eb483101",
3522
  "placeholder": "​",
3523
+ "style": "IPY_MODEL_5682a9e270a84eb3a137ba6c454e754e",
3524
+ "value": " 1.67M/? [00:00&lt;00:00, 13.7MB/s]"
3525
  }
3526
  },
3527
+ "410df68c5f5a48c8b5d7a6d7f0f3f0ee": {
3528
  "model_module": "@jupyter-widgets/base",
3529
  "model_name": "LayoutModel",
3530
  "model_module_version": "1.2.0",
 
3576
  "width": null
3577
  }
3578
  },
3579
+ "3b0bd0450cf440819aa6b56243d86719": {
3580
  "model_module": "@jupyter-widgets/base",
3581
  "model_name": "LayoutModel",
3582
  "model_module_version": "1.2.0",
 
3628
  "width": null
3629
  }
3630
  },
3631
+ "bafb910ffc8542e0a4a82ac2c5541b0b": {
3632
  "model_module": "@jupyter-widgets/controls",
3633
  "model_name": "DescriptionStyleModel",
3634
  "model_module_version": "1.5.0",
 
3643
  "description_width": ""
3644
  }
3645
  },
3646
+ "654e38a251db4c54a0cab8358e08ae54": {
3647
  "model_module": "@jupyter-widgets/base",
3648
  "model_name": "LayoutModel",
3649
  "model_module_version": "1.2.0",
 
3692
  "right": null,
3693
  "top": null,
3694
  "visibility": null,
3695
+ "width": "20px"
3696
  }
3697
  },
3698
+ "8193406afd25421b8d7125a3d694f7ee": {
3699
  "model_module": "@jupyter-widgets/controls",
3700
  "model_name": "ProgressStyleModel",
3701
  "model_module_version": "1.5.0",
 
3711
  "description_width": ""
3712
  }
3713
  },
3714
+ "ca7a2197dff34c8696f38de9eb483101": {
3715
  "model_module": "@jupyter-widgets/base",
3716
  "model_name": "LayoutModel",
3717
  "model_module_version": "1.2.0",
 
3763
  "width": null
3764
  }
3765
  },
3766
+ "5682a9e270a84eb3a137ba6c454e754e": {
3767
  "model_module": "@jupyter-widgets/controls",
3768
  "model_name": "DescriptionStyleModel",
3769
  "model_module_version": "1.5.0",
 
3778
  "description_width": ""
3779
  }
3780
  },
3781
+ "d2ea7cdbe39f421eac88fd60c07832aa": {
3782
  "model_module": "@jupyter-widgets/controls",
3783
  "model_name": "HBoxModel",
3784
  "model_module_version": "1.5.0",
 
3793
  "_view_name": "HBoxView",
3794
  "box_style": "",
3795
  "children": [
3796
+ "IPY_MODEL_3aad576dd5e044479ee1bc791098be6e",
3797
+ "IPY_MODEL_aee48a66747c4b49ab797f51fabb81dd",
3798
+ "IPY_MODEL_4cae1daba91a4a89a7a9dcb1196c1ff7"
3799
  ],
3800
+ "layout": "IPY_MODEL_b39a87f5da9241b08b203cb9e5d1ce68"
3801
  }
3802
  },
3803
+ "3aad576dd5e044479ee1bc791098be6e": {
3804
  "model_module": "@jupyter-widgets/controls",
3805
  "model_name": "HTMLModel",
3806
  "model_module_version": "1.5.0",
 
3815
  "_view_name": "HTMLView",
3816
  "description": "",
3817
  "description_tooltip": null,
3818
+ "layout": "IPY_MODEL_8352137c9363487cb401a11fb5982525",
3819
  "placeholder": "​",
3820
+ "style": "IPY_MODEL_486195810e3541d983e47541fba191ca",
3821
+ "value": "generation_config.json: 100%"
3822
  }
3823
  },
3824
+ "aee48a66747c4b49ab797f51fabb81dd": {
3825
  "model_module": "@jupyter-widgets/controls",
3826
  "model_name": "FloatProgressModel",
3827
  "model_module_version": "1.5.0",
 
3834
  "_view_module": "@jupyter-widgets/controls",
3835
  "_view_module_version": "1.5.0",
3836
  "_view_name": "ProgressView",
3837
+ "bar_style": "success",
3838
  "description": "",
3839
  "description_tooltip": null,
3840
+ "layout": "IPY_MODEL_a258a629af19449a9491965645d4b79f",
3841
+ "max": 269,
3842
  "min": 0,
3843
  "orientation": "horizontal",
3844
+ "style": "IPY_MODEL_40681743310747cd833de001a3f23c95",
3845
+ "value": 269
3846
  }
3847
  },
3848
+ "4cae1daba91a4a89a7a9dcb1196c1ff7": {
3849
  "model_module": "@jupyter-widgets/controls",
3850
  "model_name": "HTMLModel",
3851
  "model_module_version": "1.5.0",
 
3860
  "_view_name": "HTMLView",
3861
  "description": "",
3862
  "description_tooltip": null,
3863
+ "layout": "IPY_MODEL_281a36b73f884585bd5f2693409bfdc0",
3864
  "placeholder": "​",
3865
+ "style": "IPY_MODEL_8fa74caaaa9b4074927c483173e7483e",
3866
+ "value": " 269/269 [00:00&lt;00:00, 4.56kB/s]"
3867
  }
3868
  },
3869
+ "b39a87f5da9241b08b203cb9e5d1ce68": {
3870
  "model_module": "@jupyter-widgets/base",
3871
  "model_name": "LayoutModel",
3872
  "model_module_version": "1.2.0",
 
3918
  "width": null
3919
  }
3920
  },
3921
+ "8352137c9363487cb401a11fb5982525": {
3922
  "model_module": "@jupyter-widgets/base",
3923
  "model_name": "LayoutModel",
3924
  "model_module_version": "1.2.0",
 
3970
  "width": null
3971
  }
3972
  },
3973
+ "486195810e3541d983e47541fba191ca": {
3974
  "model_module": "@jupyter-widgets/controls",
3975
  "model_name": "DescriptionStyleModel",
3976
  "model_module_version": "1.5.0",
 
3985
  "description_width": ""
3986
  }
3987
  },
3988
+ "a258a629af19449a9491965645d4b79f": {
3989
  "model_module": "@jupyter-widgets/base",
3990
  "model_name": "LayoutModel",
3991
  "model_module_version": "1.2.0",
 
4037
  "width": null
4038
  }
4039
  },
4040
+ "40681743310747cd833de001a3f23c95": {
4041
  "model_module": "@jupyter-widgets/controls",
4042
  "model_name": "ProgressStyleModel",
4043
  "model_module_version": "1.5.0",
 
4053
  "description_width": ""
4054
  }
4055
  },
4056
+ "281a36b73f884585bd5f2693409bfdc0": {
4057
  "model_module": "@jupyter-widgets/base",
4058
  "model_name": "LayoutModel",
4059
  "model_module_version": "1.2.0",
 
4105
  "width": null
4106
  }
4107
  },
4108
+ "8fa74caaaa9b4074927c483173e7483e": {
4109
  "model_module": "@jupyter-widgets/controls",
4110
  "model_name": "DescriptionStyleModel",
4111
  "model_module_version": "1.5.0",
 
4120
  "description_width": ""
4121
  }
4122
  },
4123
+ "0517d3ca8f754dda9c05c58df468f389": {
4124
  "model_module": "@jupyter-widgets/controls",
4125
  "model_name": "HBoxModel",
4126
  "model_module_version": "1.5.0",
 
4135
  "_view_name": "HBoxView",
4136
  "box_style": "",
4137
  "children": [
4138
+ "IPY_MODEL_36255a6081fb4f5890671a5b134d2a88",
4139
+ "IPY_MODEL_91af530b9b00467d8ffe60f53d1ed3f7",
4140
+ "IPY_MODEL_6c5eec9d403d4852a914ec14856842d2"
4141
  ],
4142
+ "layout": "IPY_MODEL_e9ed79822b28466cb6e987928d3217ac"
4143
  }
4144
  },
4145
+ "36255a6081fb4f5890671a5b134d2a88": {
4146
  "model_module": "@jupyter-widgets/controls",
4147
  "model_name": "HTMLModel",
4148
  "model_module_version": "1.5.0",
 
4157
  "_view_name": "HTMLView",
4158
  "description": "",
4159
  "description_tooltip": null,
4160
+ "layout": "IPY_MODEL_ebe0443397974147b3845cc9e9aa20e7",
4161
  "placeholder": "​",
4162
+ "style": "IPY_MODEL_dd8ffc95d9074bf78bcb6a3b656fdf8d",
4163
+ "value": "configuration.json: 100%"
4164
  }
4165
  },
4166
+ "91af530b9b00467d8ffe60f53d1ed3f7": {
4167
  "model_module": "@jupyter-widgets/controls",
4168
  "model_name": "FloatProgressModel",
4169
  "model_module_version": "1.5.0",
 
4179
  "bar_style": "success",
4180
  "description": "",
4181
  "description_tooltip": null,
4182
+ "layout": "IPY_MODEL_5cb9185af5694c28b2e0e314539c6aed",
4183
+ "max": 73,
4184
  "min": 0,
4185
  "orientation": "horizontal",
4186
+ "style": "IPY_MODEL_b058573d771f4642b62d41ff16e0a668",
4187
+ "value": 73
4188
  }
4189
  },
4190
+ "6c5eec9d403d4852a914ec14856842d2": {
4191
  "model_module": "@jupyter-widgets/controls",
4192
  "model_name": "HTMLModel",
4193
  "model_module_version": "1.5.0",
 
4202
  "_view_name": "HTMLView",
4203
  "description": "",
4204
  "description_tooltip": null,
4205
+ "layout": "IPY_MODEL_f32f3cc12fa742f598781ab674db1b72",
4206
  "placeholder": "​",
4207
+ "style": "IPY_MODEL_980b0da3463c4f8ba6afb7b25814c9fd",
4208
+ "value": " 73.0/73.0 [00:00&lt;00:00, 1.26kB/s]"
4209
  }
4210
  },
4211
+ "e9ed79822b28466cb6e987928d3217ac": {
4212
  "model_module": "@jupyter-widgets/base",
4213
  "model_name": "LayoutModel",
4214
  "model_module_version": "1.2.0",
 
4260
  "width": null
4261
  }
4262
  },
4263
+ "ebe0443397974147b3845cc9e9aa20e7": {
4264
  "model_module": "@jupyter-widgets/base",
4265
  "model_name": "LayoutModel",
4266
  "model_module_version": "1.2.0",
 
4312
  "width": null
4313
  }
4314
  },
4315
+ "dd8ffc95d9074bf78bcb6a3b656fdf8d": {
4316
  "model_module": "@jupyter-widgets/controls",
4317
  "model_name": "DescriptionStyleModel",
4318
  "model_module_version": "1.5.0",
 
4327
  "description_width": ""
4328
  }
4329
  },
4330
+ "5cb9185af5694c28b2e0e314539c6aed": {
4331
  "model_module": "@jupyter-widgets/base",
4332
  "model_name": "LayoutModel",
4333
  "model_module_version": "1.2.0",
 
4379
  "width": null
4380
  }
4381
  },
4382
+ "b058573d771f4642b62d41ff16e0a668": {
4383
  "model_module": "@jupyter-widgets/controls",
4384
  "model_name": "ProgressStyleModel",
4385
  "model_module_version": "1.5.0",
 
4395
  "description_width": ""
4396
  }
4397
  },
4398
+ "f32f3cc12fa742f598781ab674db1b72": {
4399
  "model_module": "@jupyter-widgets/base",
4400
  "model_name": "LayoutModel",
4401
  "model_module_version": "1.2.0",
 
4447
  "width": null
4448
  }
4449
  },
4450
+ "980b0da3463c4f8ba6afb7b25814c9fd": {
4451
  "model_module": "@jupyter-widgets/controls",
4452
  "model_name": "DescriptionStyleModel",
4453
  "model_module_version": "1.5.0",
 
4462
  "description_width": ""
4463
  }
4464
  },
4465
+ "b4dbd23ca854403b98b3550f10672c3d": {
4466
  "model_module": "@jupyter-widgets/controls",
4467
  "model_name": "HBoxModel",
4468
  "model_module_version": "1.5.0",
 
4477
  "_view_name": "HBoxView",
4478
  "box_style": "",
4479
  "children": [
4480
+ "IPY_MODEL_7fb9acd8bf0c495baec3ee9710bbb83d",
4481
+ "IPY_MODEL_1198981dbe814b998b1ec872a7429910",
4482
+ "IPY_MODEL_ed1e88050a704cd89810b3e7aa5aa3ff"
4483
  ],
4484
+ "layout": "IPY_MODEL_d6a29cbf2da04b6cbc8fddef4ed90189"
4485
  }
4486
  },
4487
+ "7fb9acd8bf0c495baec3ee9710bbb83d": {
4488
  "model_module": "@jupyter-widgets/controls",
4489
  "model_name": "HTMLModel",
4490
  "model_module_version": "1.5.0",
 
4499
  "_view_name": "HTMLView",
4500
  "description": "",
4501
  "description_tooltip": null,
4502
+ "layout": "IPY_MODEL_d7e48b4cfc5b4effaa560d645a6d5ce1",
4503
  "placeholder": "​",
4504
+ "style": "IPY_MODEL_8447bf99e9c6467f93b3937d0dcdceee",
4505
+ "value": "tokenizer.json: "
4506
  }
4507
  },
4508
+ "1198981dbe814b998b1ec872a7429910": {
4509
  "model_module": "@jupyter-widgets/controls",
4510
  "model_name": "FloatProgressModel",
4511
  "model_module_version": "1.5.0",
 
4521
  "bar_style": "success",
4522
  "description": "",
4523
  "description_tooltip": null,
4524
+ "layout": "IPY_MODEL_424d45e11fd74590be78c9c8340ace40",
4525
  "max": 1,
4526
  "min": 0,
4527
  "orientation": "horizontal",
4528
+ "style": "IPY_MODEL_940723bf0502461a8804999207eda050",
4529
  "value": 1
4530
  }
4531
  },
4532
+ "ed1e88050a704cd89810b3e7aa5aa3ff": {
4533
  "model_module": "@jupyter-widgets/controls",
4534
  "model_name": "HTMLModel",
4535
  "model_module_version": "1.5.0",
 
4544
  "_view_name": "HTMLView",
4545
  "description": "",
4546
  "description_tooltip": null,
4547
+ "layout": "IPY_MODEL_9d6faeb02b2a4195a2c3975d81050c86",
4548
  "placeholder": "​",
4549
+ "style": "IPY_MODEL_70de2bd915c040e499d2165ab44c8b87",
4550
+ "value": " 7.03M/? [00:00&lt;00:00, 17.0MB/s]"
4551
  }
4552
  },
4553
+ "d6a29cbf2da04b6cbc8fddef4ed90189": {
4554
  "model_module": "@jupyter-widgets/base",
4555
  "model_name": "LayoutModel",
4556
  "model_module_version": "1.2.0",
 
4602
  "width": null
4603
  }
4604
  },
4605
+ "d7e48b4cfc5b4effaa560d645a6d5ce1": {
4606
  "model_module": "@jupyter-widgets/base",
4607
  "model_name": "LayoutModel",
4608
  "model_module_version": "1.2.0",
 
4654
  "width": null
4655
  }
4656
  },
4657
+ "8447bf99e9c6467f93b3937d0dcdceee": {
4658
  "model_module": "@jupyter-widgets/controls",
4659
  "model_name": "DescriptionStyleModel",
4660
  "model_module_version": "1.5.0",
 
4669
  "description_width": ""
4670
  }
4671
  },
4672
+ "424d45e11fd74590be78c9c8340ace40": {
4673
  "model_module": "@jupyter-widgets/base",
4674
  "model_name": "LayoutModel",
4675
  "model_module_version": "1.2.0",
 
4721
  "width": "20px"
4722
  }
4723
  },
4724
+ "940723bf0502461a8804999207eda050": {
4725
  "model_module": "@jupyter-widgets/controls",
4726
  "model_name": "ProgressStyleModel",
4727
  "model_module_version": "1.5.0",
 
4737
  "description_width": ""
4738
  }
4739
  },
4740
+ "9d6faeb02b2a4195a2c3975d81050c86": {
4741
  "model_module": "@jupyter-widgets/base",
4742
  "model_name": "LayoutModel",
4743
  "model_module_version": "1.2.0",
 
4789
  "width": null
4790
  }
4791
  },
4792
+ "70de2bd915c040e499d2165ab44c8b87": {
4793
  "model_module": "@jupyter-widgets/controls",
4794
  "model_name": "DescriptionStyleModel",
4795
  "model_module_version": "1.5.0",
 
4804
  "description_width": ""
4805
  }
4806
  },
4807
+ "067b7146c43d409d8279ba5f1add3d37": {
4808
  "model_module": "@jupyter-widgets/controls",
4809
  "model_name": "HBoxModel",
4810
  "model_module_version": "1.5.0",
 
4819
  "_view_name": "HBoxView",
4820
  "box_style": "",
4821
  "children": [
4822
+ "IPY_MODEL_212e1703f3234410b6b4babb3fcdff31",
4823
+ "IPY_MODEL_17f7e5c1bcbe4c1fbf1d9e5a68c88174",
4824
+ "IPY_MODEL_38a0b812722446a0adfdf432d178bca3"
4825
  ],
4826
+ "layout": "IPY_MODEL_8412d6436c234fb2b0fbe4c6109bcc11"
4827
  }
4828
  },
4829
+ "212e1703f3234410b6b4babb3fcdff31": {
4830
  "model_module": "@jupyter-widgets/controls",
4831
  "model_name": "HTMLModel",
4832
  "model_module_version": "1.5.0",
 
4841
  "_view_name": "HTMLView",
4842
  "description": "",
4843
  "description_tooltip": null,
4844
+ "layout": "IPY_MODEL_d161beab3f8c4ed3b7e1e99a50e0d682",
4845
  "placeholder": "​",
4846
+ "style": "IPY_MODEL_1a2d30a8995e4de5bc16f9c77723cc14",
4847
+ "value": "tokenizer_config.json: "
4848
  }
4849
  },
4850
+ "17f7e5c1bcbe4c1fbf1d9e5a68c88174": {
4851
  "model_module": "@jupyter-widgets/controls",
4852
  "model_name": "FloatProgressModel",
4853
  "model_module_version": "1.5.0",
 
4863
  "bar_style": "success",
4864
  "description": "",
4865
  "description_tooltip": null,
4866
+ "layout": "IPY_MODEL_a50c1c8ef59641a096560837ad19102d",
4867
+ "max": 1,
4868
  "min": 0,
4869
  "orientation": "horizontal",
4870
+ "style": "IPY_MODEL_6ac5b6703d3b4764a4024d529663c4bb",
4871
+ "value": 1
4872
  }
4873
  },
4874
+ "38a0b812722446a0adfdf432d178bca3": {
4875
  "model_module": "@jupyter-widgets/controls",
4876
  "model_name": "HTMLModel",
4877
  "model_module_version": "1.5.0",
 
4886
  "_view_name": "HTMLView",
4887
  "description": "",
4888
  "description_tooltip": null,
4889
+ "layout": "IPY_MODEL_22ae462317594dedaf012ba3baa5feb5",
4890
  "placeholder": "​",
4891
+ "style": "IPY_MODEL_e4b83d48686c4850ac698602ab9d6ae5",
4892
+ "value": " 11.0k/? [00:00&lt;00:00, 670kB/s]"
4893
  }
4894
  },
4895
+ "8412d6436c234fb2b0fbe4c6109bcc11": {
4896
  "model_module": "@jupyter-widgets/base",
4897
  "model_name": "LayoutModel",
4898
  "model_module_version": "1.2.0",
 
4944
  "width": null
4945
  }
4946
  },
4947
+ "d161beab3f8c4ed3b7e1e99a50e0d682": {
4948
  "model_module": "@jupyter-widgets/base",
4949
  "model_name": "LayoutModel",
4950
  "model_module_version": "1.2.0",
 
4996
  "width": null
4997
  }
4998
  },
4999
+ "1a2d30a8995e4de5bc16f9c77723cc14": {
5000
  "model_module": "@jupyter-widgets/controls",
5001
  "model_name": "DescriptionStyleModel",
5002
  "model_module_version": "1.5.0",
 
5011
  "description_width": ""
5012
  }
5013
  },
5014
+ "a50c1c8ef59641a096560837ad19102d": {
5015
  "model_module": "@jupyter-widgets/base",
5016
  "model_name": "LayoutModel",
5017
  "model_module_version": "1.2.0",
 
5060
  "right": null,
5061
  "top": null,
5062
  "visibility": null,
5063
+ "width": "20px"
5064
  }
5065
  },
5066
+ "6ac5b6703d3b4764a4024d529663c4bb": {
5067
  "model_module": "@jupyter-widgets/controls",
5068
  "model_name": "ProgressStyleModel",
5069
  "model_module_version": "1.5.0",
 
5079
  "description_width": ""
5080
  }
5081
  },
5082
+ "22ae462317594dedaf012ba3baa5feb5": {
5083
  "model_module": "@jupyter-widgets/base",
5084
  "model_name": "LayoutModel",
5085
  "model_module_version": "1.2.0",
 
5131
  "width": null
5132
  }
5133
  },
5134
+ "e4b83d48686c4850ac698602ab9d6ae5": {
5135
  "model_module": "@jupyter-widgets/controls",
5136
  "model_name": "DescriptionStyleModel",
5137
  "model_module_version": "1.5.0",
 
5146
  "description_width": ""
5147
  }
5148
  },
5149
+ "96eab2db9f1c47e3be7f05e17dd4bc2e": {
5150
  "model_module": "@jupyter-widgets/controls",
5151
  "model_name": "HBoxModel",
5152
  "model_module_version": "1.5.0",
 
5161
  "_view_name": "HBoxView",
5162
  "box_style": "",
5163
  "children": [
5164
+ "IPY_MODEL_bac648fd4d524113acc6dc6935080b7d",
5165
+ "IPY_MODEL_bbf592fa8a9a47f4a1ca4cce63d1de5b",
5166
+ "IPY_MODEL_520912d0ea104132abe22ceda62df8df"
5167
  ],
5168
+ "layout": "IPY_MODEL_0eccb66584b84bb496e2897fb7336893"
5169
  }
5170
  },
5171
+ "bac648fd4d524113acc6dc6935080b7d": {
5172
  "model_module": "@jupyter-widgets/controls",
5173
  "model_name": "HTMLModel",
5174
  "model_module_version": "1.5.0",
 
5183
  "_view_name": "HTMLView",
5184
  "description": "",
5185
  "description_tooltip": null,
5186
+ "layout": "IPY_MODEL_6ebbe27bf2fa4f939e374b414efa74f3",
5187
  "placeholder": "​",
5188
+ "style": "IPY_MODEL_81673221a8194854b93519890687c6b3",
5189
+ "value": "vocab.json: "
5190
  }
5191
  },
5192
+ "bbf592fa8a9a47f4a1ca4cce63d1de5b": {
5193
  "model_module": "@jupyter-widgets/controls",
5194
  "model_name": "FloatProgressModel",
5195
  "model_module_version": "1.5.0",
 
5205
  "bar_style": "success",
5206
  "description": "",
5207
  "description_tooltip": null,
5208
+ "layout": "IPY_MODEL_5dfc118f189f49058104d850fcef4cfe",
5209
  "max": 1,
5210
  "min": 0,
5211
  "orientation": "horizontal",
5212
+ "style": "IPY_MODEL_ad218808233a46b79defe021a831730d",
5213
  "value": 1
5214
  }
5215
  },
5216
+ "520912d0ea104132abe22ceda62df8df": {
5217
  "model_module": "@jupyter-widgets/controls",
5218
  "model_name": "HTMLModel",
5219
  "model_module_version": "1.5.0",
 
5228
  "_view_name": "HTMLView",
5229
  "description": "",
5230
  "description_tooltip": null,
5231
+ "layout": "IPY_MODEL_4064b1e4ff5144508f4c2cf414297354",
5232
  "placeholder": "​",
5233
+ "style": "IPY_MODEL_e39c8e68b39549dfb33327e4b1e0cbf8",
5234
+ "value": " 2.78M/? [00:00&lt;00:00, 9.53MB/s]"
5235
  }
5236
  },
5237
+ "0eccb66584b84bb496e2897fb7336893": {
5238
  "model_module": "@jupyter-widgets/base",
5239
  "model_name": "LayoutModel",
5240
  "model_module_version": "1.2.0",
 
5286
  "width": null
5287
  }
5288
  },
5289
+ "6ebbe27bf2fa4f939e374b414efa74f3": {
5290
  "model_module": "@jupyter-widgets/base",
5291
  "model_name": "LayoutModel",
5292
  "model_module_version": "1.2.0",
 
5338
  "width": null
5339
  }
5340
  },
5341
+ "81673221a8194854b93519890687c6b3": {
5342
  "model_module": "@jupyter-widgets/controls",
5343
  "model_name": "DescriptionStyleModel",
5344
  "model_module_version": "1.5.0",
 
5353
  "description_width": ""
5354
  }
5355
  },
5356
+ "5dfc118f189f49058104d850fcef4cfe": {
5357
  "model_module": "@jupyter-widgets/base",
5358
  "model_name": "LayoutModel",
5359
  "model_module_version": "1.2.0",
 
5405
  "width": "20px"
5406
  }
5407
  },
5408
+ "ad218808233a46b79defe021a831730d": {
5409
+ "model_module": "@jupyter-widgets/controls",
5410
+ "model_name": "ProgressStyleModel",
5411
+ "model_module_version": "1.5.0",
5412
+ "state": {
5413
+ "_model_module": "@jupyter-widgets/controls",
5414
+ "_model_module_version": "1.5.0",
5415
+ "_model_name": "ProgressStyleModel",
5416
+ "_view_count": null,
5417
+ "_view_module": "@jupyter-widgets/base",
5418
+ "_view_module_version": "1.2.0",
5419
+ "_view_name": "StyleView",
5420
+ "bar_color": null,
5421
+ "description_width": ""
5422
+ }
5423
+ },
5424
+ "4064b1e4ff5144508f4c2cf414297354": {
5425
+ "model_module": "@jupyter-widgets/base",
5426
+ "model_name": "LayoutModel",
5427
+ "model_module_version": "1.2.0",
5428
+ "state": {
5429
+ "_model_module": "@jupyter-widgets/base",
5430
+ "_model_module_version": "1.2.0",
5431
+ "_model_name": "LayoutModel",
5432
+ "_view_count": null,
5433
+ "_view_module": "@jupyter-widgets/base",
5434
+ "_view_module_version": "1.2.0",
5435
+ "_view_name": "LayoutView",
5436
+ "align_content": null,
5437
+ "align_items": null,
5438
+ "align_self": null,
5439
+ "border": null,
5440
+ "bottom": null,
5441
+ "display": null,
5442
+ "flex": null,
5443
+ "flex_flow": null,
5444
+ "grid_area": null,
5445
+ "grid_auto_columns": null,
5446
+ "grid_auto_flow": null,
5447
+ "grid_auto_rows": null,
5448
+ "grid_column": null,
5449
+ "grid_gap": null,
5450
+ "grid_row": null,
5451
+ "grid_template_areas": null,
5452
+ "grid_template_columns": null,
5453
+ "grid_template_rows": null,
5454
+ "height": null,
5455
+ "justify_content": null,
5456
+ "justify_items": null,
5457
+ "left": null,
5458
+ "margin": null,
5459
+ "max_height": null,
5460
+ "max_width": null,
5461
+ "min_height": null,
5462
+ "min_width": null,
5463
+ "object_fit": null,
5464
+ "object_position": null,
5465
+ "order": null,
5466
+ "overflow": null,
5467
+ "overflow_x": null,
5468
+ "overflow_y": null,
5469
+ "padding": null,
5470
+ "right": null,
5471
+ "top": null,
5472
+ "visibility": null,
5473
+ "width": null
5474
+ }
5475
+ },
5476
+ "e39c8e68b39549dfb33327e4b1e0cbf8": {
5477
+ "model_module": "@jupyter-widgets/controls",
5478
+ "model_name": "DescriptionStyleModel",
5479
+ "model_module_version": "1.5.0",
5480
+ "state": {
5481
+ "_model_module": "@jupyter-widgets/controls",
5482
+ "_model_module_version": "1.5.0",
5483
+ "_model_name": "DescriptionStyleModel",
5484
+ "_view_count": null,
5485
+ "_view_module": "@jupyter-widgets/base",
5486
+ "_view_module_version": "1.2.0",
5487
+ "_view_name": "StyleView",
5488
+ "description_width": ""
5489
+ }
5490
+ },
5491
+ "87e5466584114b6daf247e76b485e20b": {
5492
+ "model_module": "@jupyter-widgets/controls",
5493
+ "model_name": "HBoxModel",
5494
+ "model_module_version": "1.5.0",
5495
+ "state": {
5496
+ "_dom_classes": [],
5497
+ "_model_module": "@jupyter-widgets/controls",
5498
+ "_model_module_version": "1.5.0",
5499
+ "_model_name": "HBoxModel",
5500
+ "_view_count": null,
5501
+ "_view_module": "@jupyter-widgets/controls",
5502
+ "_view_module_version": "1.5.0",
5503
+ "_view_name": "HBoxView",
5504
+ "box_style": "",
5505
+ "children": [
5506
+ "IPY_MODEL_edc06f2c96554162844c96daf87077ea",
5507
+ "IPY_MODEL_20ad54d2b1244cbab48773a5af2ba243",
5508
+ "IPY_MODEL_c26352e2236c4e30939a21cfa1884550"
5509
+ ],
5510
+ "layout": "IPY_MODEL_412887220d7f45a2adbd530cacaced3e"
5511
+ }
5512
+ },
5513
+ "edc06f2c96554162844c96daf87077ea": {
5514
+ "model_module": "@jupyter-widgets/controls",
5515
+ "model_name": "HTMLModel",
5516
+ "model_module_version": "1.5.0",
5517
+ "state": {
5518
+ "_dom_classes": [],
5519
+ "_model_module": "@jupyter-widgets/controls",
5520
+ "_model_module_version": "1.5.0",
5521
+ "_model_name": "HTMLModel",
5522
+ "_view_count": null,
5523
+ "_view_module": "@jupyter-widgets/controls",
5524
+ "_view_module_version": "1.5.0",
5525
+ "_view_name": "HTMLView",
5526
+ "description": "",
5527
+ "description_tooltip": null,
5528
+ "layout": "IPY_MODEL_89689e97531d4f4db2937d31d0fb6538",
5529
+ "placeholder": "​",
5530
+ "style": "IPY_MODEL_846cd637017d46ee96a519e2f47a833b",
5531
+ "value": "Loading checkpoint shards:   0%"
5532
+ }
5533
+ },
5534
+ "20ad54d2b1244cbab48773a5af2ba243": {
5535
+ "model_module": "@jupyter-widgets/controls",
5536
+ "model_name": "FloatProgressModel",
5537
+ "model_module_version": "1.5.0",
5538
+ "state": {
5539
+ "_dom_classes": [],
5540
+ "_model_module": "@jupyter-widgets/controls",
5541
+ "_model_module_version": "1.5.0",
5542
+ "_model_name": "FloatProgressModel",
5543
+ "_view_count": null,
5544
+ "_view_module": "@jupyter-widgets/controls",
5545
+ "_view_module_version": "1.5.0",
5546
+ "_view_name": "ProgressView",
5547
+ "bar_style": "danger",
5548
+ "description": "",
5549
+ "description_tooltip": null,
5550
+ "layout": "IPY_MODEL_63bb7f100c464dd8bd52340fc94f51f1",
5551
+ "max": 3,
5552
+ "min": 0,
5553
+ "orientation": "horizontal",
5554
+ "style": "IPY_MODEL_1164b72288d2409aaed65050b9a9470d",
5555
+ "value": 0
5556
+ }
5557
+ },
5558
+ "c26352e2236c4e30939a21cfa1884550": {
5559
+ "model_module": "@jupyter-widgets/controls",
5560
+ "model_name": "HTMLModel",
5561
+ "model_module_version": "1.5.0",
5562
+ "state": {
5563
+ "_dom_classes": [],
5564
+ "_model_module": "@jupyter-widgets/controls",
5565
+ "_model_module_version": "1.5.0",
5566
+ "_model_name": "HTMLModel",
5567
+ "_view_count": null,
5568
+ "_view_module": "@jupyter-widgets/controls",
5569
+ "_view_module_version": "1.5.0",
5570
+ "_view_name": "HTMLView",
5571
+ "description": "",
5572
+ "description_tooltip": null,
5573
+ "layout": "IPY_MODEL_1c643ffb974849f3933cc1c52ba014e9",
5574
+ "placeholder": "​",
5575
+ "style": "IPY_MODEL_e697d39f24be4ca18f4a438b899f21eb",
5576
+ "value": " 0/3 [00:00&lt;?, ?it/s]"
5577
+ }
5578
+ },
5579
+ "412887220d7f45a2adbd530cacaced3e": {
5580
+ "model_module": "@jupyter-widgets/base",
5581
+ "model_name": "LayoutModel",
5582
+ "model_module_version": "1.2.0",
5583
+ "state": {
5584
+ "_model_module": "@jupyter-widgets/base",
5585
+ "_model_module_version": "1.2.0",
5586
+ "_model_name": "LayoutModel",
5587
+ "_view_count": null,
5588
+ "_view_module": "@jupyter-widgets/base",
5589
+ "_view_module_version": "1.2.0",
5590
+ "_view_name": "LayoutView",
5591
+ "align_content": null,
5592
+ "align_items": null,
5593
+ "align_self": null,
5594
+ "border": null,
5595
+ "bottom": null,
5596
+ "display": null,
5597
+ "flex": null,
5598
+ "flex_flow": null,
5599
+ "grid_area": null,
5600
+ "grid_auto_columns": null,
5601
+ "grid_auto_flow": null,
5602
+ "grid_auto_rows": null,
5603
+ "grid_column": null,
5604
+ "grid_gap": null,
5605
+ "grid_row": null,
5606
+ "grid_template_areas": null,
5607
+ "grid_template_columns": null,
5608
+ "grid_template_rows": null,
5609
+ "height": null,
5610
+ "justify_content": null,
5611
+ "justify_items": null,
5612
+ "left": null,
5613
+ "margin": null,
5614
+ "max_height": null,
5615
+ "max_width": null,
5616
+ "min_height": null,
5617
+ "min_width": null,
5618
+ "object_fit": null,
5619
+ "object_position": null,
5620
+ "order": null,
5621
+ "overflow": null,
5622
+ "overflow_x": null,
5623
+ "overflow_y": null,
5624
+ "padding": null,
5625
+ "right": null,
5626
+ "top": null,
5627
+ "visibility": null,
5628
+ "width": null
5629
+ }
5630
+ },
5631
+ "89689e97531d4f4db2937d31d0fb6538": {
5632
+ "model_module": "@jupyter-widgets/base",
5633
+ "model_name": "LayoutModel",
5634
+ "model_module_version": "1.2.0",
5635
+ "state": {
5636
+ "_model_module": "@jupyter-widgets/base",
5637
+ "_model_module_version": "1.2.0",
5638
+ "_model_name": "LayoutModel",
5639
+ "_view_count": null,
5640
+ "_view_module": "@jupyter-widgets/base",
5641
+ "_view_module_version": "1.2.0",
5642
+ "_view_name": "LayoutView",
5643
+ "align_content": null,
5644
+ "align_items": null,
5645
+ "align_self": null,
5646
+ "border": null,
5647
+ "bottom": null,
5648
+ "display": null,
5649
+ "flex": null,
5650
+ "flex_flow": null,
5651
+ "grid_area": null,
5652
+ "grid_auto_columns": null,
5653
+ "grid_auto_flow": null,
5654
+ "grid_auto_rows": null,
5655
+ "grid_column": null,
5656
+ "grid_gap": null,
5657
+ "grid_row": null,
5658
+ "grid_template_areas": null,
5659
+ "grid_template_columns": null,
5660
+ "grid_template_rows": null,
5661
+ "height": null,
5662
+ "justify_content": null,
5663
+ "justify_items": null,
5664
+ "left": null,
5665
+ "margin": null,
5666
+ "max_height": null,
5667
+ "max_width": null,
5668
+ "min_height": null,
5669
+ "min_width": null,
5670
+ "object_fit": null,
5671
+ "object_position": null,
5672
+ "order": null,
5673
+ "overflow": null,
5674
+ "overflow_x": null,
5675
+ "overflow_y": null,
5676
+ "padding": null,
5677
+ "right": null,
5678
+ "top": null,
5679
+ "visibility": null,
5680
+ "width": null
5681
+ }
5682
+ },
5683
+ "846cd637017d46ee96a519e2f47a833b": {
5684
+ "model_module": "@jupyter-widgets/controls",
5685
+ "model_name": "DescriptionStyleModel",
5686
+ "model_module_version": "1.5.0",
5687
+ "state": {
5688
+ "_model_module": "@jupyter-widgets/controls",
5689
+ "_model_module_version": "1.5.0",
5690
+ "_model_name": "DescriptionStyleModel",
5691
+ "_view_count": null,
5692
+ "_view_module": "@jupyter-widgets/base",
5693
+ "_view_module_version": "1.2.0",
5694
+ "_view_name": "StyleView",
5695
+ "description_width": ""
5696
+ }
5697
+ },
5698
+ "63bb7f100c464dd8bd52340fc94f51f1": {
5699
+ "model_module": "@jupyter-widgets/base",
5700
+ "model_name": "LayoutModel",
5701
+ "model_module_version": "1.2.0",
5702
+ "state": {
5703
+ "_model_module": "@jupyter-widgets/base",
5704
+ "_model_module_version": "1.2.0",
5705
+ "_model_name": "LayoutModel",
5706
+ "_view_count": null,
5707
+ "_view_module": "@jupyter-widgets/base",
5708
+ "_view_module_version": "1.2.0",
5709
+ "_view_name": "LayoutView",
5710
+ "align_content": null,
5711
+ "align_items": null,
5712
+ "align_self": null,
5713
+ "border": null,
5714
+ "bottom": null,
5715
+ "display": null,
5716
+ "flex": null,
5717
+ "flex_flow": null,
5718
+ "grid_area": null,
5719
+ "grid_auto_columns": null,
5720
+ "grid_auto_flow": null,
5721
+ "grid_auto_rows": null,
5722
+ "grid_column": null,
5723
+ "grid_gap": null,
5724
+ "grid_row": null,
5725
+ "grid_template_areas": null,
5726
+ "grid_template_columns": null,
5727
+ "grid_template_rows": null,
5728
+ "height": null,
5729
+ "justify_content": null,
5730
+ "justify_items": null,
5731
+ "left": null,
5732
+ "margin": null,
5733
+ "max_height": null,
5734
+ "max_width": null,
5735
+ "min_height": null,
5736
+ "min_width": null,
5737
+ "object_fit": null,
5738
+ "object_position": null,
5739
+ "order": null,
5740
+ "overflow": null,
5741
+ "overflow_x": null,
5742
+ "overflow_y": null,
5743
+ "padding": null,
5744
+ "right": null,
5745
+ "top": null,
5746
+ "visibility": null,
5747
+ "width": null
5748
+ }
5749
+ },
5750
+ "1164b72288d2409aaed65050b9a9470d": {
5751
  "model_module": "@jupyter-widgets/controls",
5752
  "model_name": "ProgressStyleModel",
5753
  "model_module_version": "1.5.0",
 
5763
  "description_width": ""
5764
  }
5765
  },
5766
+ "1c643ffb974849f3933cc1c52ba014e9": {
5767
  "model_module": "@jupyter-widgets/base",
5768
  "model_name": "LayoutModel",
5769
  "model_module_version": "1.2.0",
 
5815
  "width": null
5816
  }
5817
  },
5818
+ "e697d39f24be4ca18f4a438b899f21eb": {
5819
  "model_module": "@jupyter-widgets/controls",
5820
  "model_name": "DescriptionStyleModel",
5821
  "model_module_version": "1.5.0",
 
6669
  "metadata": {
6670
  "colab": {
6671
  "base_uri": "https://localhost:8080/",
6672
+ "height": 803,
6673
  "referenced_widgets": [
6674
+ "b2d96c62ece74d10ae8cfa0368bdef5d",
6675
+ "026549e161b746819e82057daa34d013",
6676
+ "5e7403e444914be28ff4dffea6b0e223",
6677
+ "8a47ce5909fa46ab96d5b289c35cb3c2",
6678
+ "dcb0c08779074052a98d87804be0ffbc",
6679
+ "e02027bec5214982b5c51a556935799e",
6680
+ "2d46faefa76e4f03903d970edcab8e6b",
6681
+ "252ee04b367841778ae4c89a84c5f1de",
6682
+ "ad5d4df02464404d80de57028d815692",
6683
+ "c7b6596488a04171b96271bb41a918ca",
6684
+ "dce80ab74a6d41afbeb65708f855edb5",
6685
+ "2bc646b6c1224558b1513c2e8d3aeec4",
6686
+ "5eae870a01094dc2a79a1e9580ecd0e3",
6687
+ "aae3998d02b542349a0d63efdc796f5f",
6688
+ "db3eb513d928461cb9f29c7a81a70eef",
6689
+ "6b9b92000d0243669e0b4488aa490109",
6690
+ "1a24e8e6ef0c4181831de003c8576d88",
6691
+ "66d73112d71d441f9b87cac7169491f8",
6692
+ "8b46745fb1764422869c83b231197585",
6693
+ "05b38f4f3a97411495f7678a938fd371",
6694
+ "f0942e71542048a49ee438966bac45ac",
6695
+ "ae73e40ccac5442494b570893f5e1d23",
6696
+ "8c53093a52d249a4b10e8dad950aef62",
6697
+ "24d3d9a8ea6a4303be819fde09d698e6",
6698
+ "804b4627bb59452b8d97a304a0beaa99",
6699
+ "12cd9edc9fd844d09a20bd61e359da61",
6700
+ "410df68c5f5a48c8b5d7a6d7f0f3f0ee",
6701
+ "3b0bd0450cf440819aa6b56243d86719",
6702
+ "bafb910ffc8542e0a4a82ac2c5541b0b",
6703
+ "654e38a251db4c54a0cab8358e08ae54",
6704
+ "8193406afd25421b8d7125a3d694f7ee",
6705
+ "ca7a2197dff34c8696f38de9eb483101",
6706
+ "5682a9e270a84eb3a137ba6c454e754e",
6707
+ "d2ea7cdbe39f421eac88fd60c07832aa",
6708
+ "3aad576dd5e044479ee1bc791098be6e",
6709
+ "aee48a66747c4b49ab797f51fabb81dd",
6710
+ "4cae1daba91a4a89a7a9dcb1196c1ff7",
6711
+ "b39a87f5da9241b08b203cb9e5d1ce68",
6712
+ "8352137c9363487cb401a11fb5982525",
6713
+ "486195810e3541d983e47541fba191ca",
6714
+ "a258a629af19449a9491965645d4b79f",
6715
+ "40681743310747cd833de001a3f23c95",
6716
+ "281a36b73f884585bd5f2693409bfdc0",
6717
+ "8fa74caaaa9b4074927c483173e7483e",
6718
+ "0517d3ca8f754dda9c05c58df468f389",
6719
+ "36255a6081fb4f5890671a5b134d2a88",
6720
+ "91af530b9b00467d8ffe60f53d1ed3f7",
6721
+ "6c5eec9d403d4852a914ec14856842d2",
6722
+ "e9ed79822b28466cb6e987928d3217ac",
6723
+ "ebe0443397974147b3845cc9e9aa20e7",
6724
+ "dd8ffc95d9074bf78bcb6a3b656fdf8d",
6725
+ "5cb9185af5694c28b2e0e314539c6aed",
6726
+ "b058573d771f4642b62d41ff16e0a668",
6727
+ "f32f3cc12fa742f598781ab674db1b72",
6728
+ "980b0da3463c4f8ba6afb7b25814c9fd",
6729
+ "b4dbd23ca854403b98b3550f10672c3d",
6730
+ "7fb9acd8bf0c495baec3ee9710bbb83d",
6731
+ "1198981dbe814b998b1ec872a7429910",
6732
+ "ed1e88050a704cd89810b3e7aa5aa3ff",
6733
+ "d6a29cbf2da04b6cbc8fddef4ed90189",
6734
+ "d7e48b4cfc5b4effaa560d645a6d5ce1",
6735
+ "8447bf99e9c6467f93b3937d0dcdceee",
6736
+ "424d45e11fd74590be78c9c8340ace40",
6737
+ "940723bf0502461a8804999207eda050",
6738
+ "9d6faeb02b2a4195a2c3975d81050c86",
6739
+ "70de2bd915c040e499d2165ab44c8b87",
6740
+ "067b7146c43d409d8279ba5f1add3d37",
6741
+ "212e1703f3234410b6b4babb3fcdff31",
6742
+ "17f7e5c1bcbe4c1fbf1d9e5a68c88174",
6743
+ "38a0b812722446a0adfdf432d178bca3",
6744
+ "8412d6436c234fb2b0fbe4c6109bcc11",
6745
+ "d161beab3f8c4ed3b7e1e99a50e0d682",
6746
+ "1a2d30a8995e4de5bc16f9c77723cc14",
6747
+ "a50c1c8ef59641a096560837ad19102d",
6748
+ "6ac5b6703d3b4764a4024d529663c4bb",
6749
+ "22ae462317594dedaf012ba3baa5feb5",
6750
+ "e4b83d48686c4850ac698602ab9d6ae5",
6751
+ "96eab2db9f1c47e3be7f05e17dd4bc2e",
6752
+ "bac648fd4d524113acc6dc6935080b7d",
6753
+ "bbf592fa8a9a47f4a1ca4cce63d1de5b",
6754
+ "520912d0ea104132abe22ceda62df8df",
6755
+ "0eccb66584b84bb496e2897fb7336893",
6756
+ "6ebbe27bf2fa4f939e374b414efa74f3",
6757
+ "81673221a8194854b93519890687c6b3",
6758
+ "5dfc118f189f49058104d850fcef4cfe",
6759
+ "ad218808233a46b79defe021a831730d",
6760
+ "4064b1e4ff5144508f4c2cf414297354",
6761
+ "e39c8e68b39549dfb33327e4b1e0cbf8",
6762
+ "87e5466584114b6daf247e76b485e20b",
6763
+ "edc06f2c96554162844c96daf87077ea",
6764
+ "20ad54d2b1244cbab48773a5af2ba243",
6765
+ "c26352e2236c4e30939a21cfa1884550",
6766
+ "412887220d7f45a2adbd530cacaced3e",
6767
+ "89689e97531d4f4db2937d31d0fb6538",
6768
+ "846cd637017d46ee96a519e2f47a833b",
6769
+ "63bb7f100c464dd8bd52340fc94f51f1",
6770
+ "1164b72288d2409aaed65050b9a9470d",
6771
+ "1c643ffb974849f3933cc1c52ba014e9",
6772
+ "e697d39f24be4ca18f4a438b899f21eb"
6773
  ]
6774
  },
6775
  "id": "d97388b1",
6776
+ "outputId": "3bd82301-029f-4ab0-ab24-23f0040c29c6"
6777
  },
6778
  "source": [
6779
  "from huggingface_hub import snapshot_download\n",
 
6810
  "print(f\"SDNQ Model device: {next(sdnq_model.parameters()).device}\")\n",
6811
  "print(f\"SDNQ Model dtype: {next(sdnq_model.parameters()).dtype}\")"
6812
  ],
6813
+ "execution_count": 8,
6814
  "outputs": [
6815
  {
6816
  "output_type": "stream",
 
6823
  "output_type": "display_data",
6824
  "data": {
6825
  "text/plain": [
6826
+ "Fetching 17 files: 0%| | 0/17 [00:00<?, ?it/s]"
6827
+ ],
6828
+ "application/vnd.jupyter.widget-view+json": {
6829
+ "version_major": 2,
6830
+ "version_minor": 0,
6831
+ "model_id": "b2d96c62ece74d10ae8cfa0368bdef5d"
6832
+ }
6833
+ },
6834
+ "metadata": {}
6835
+ },
6836
+ {
6837
+ "output_type": "display_data",
6838
+ "data": {
6839
+ "text/plain": [
6840
+ "chat_template.json: 0.00B [00:00, ?B/s]"
6841
  ],
6842
  "application/vnd.jupyter.widget-view+json": {
6843
  "version_major": 2,
6844
  "version_minor": 0,
6845
+ "model_id": "2bc646b6c1224558b1513c2e8d3aeec4"
6846
  }
6847
  },
6848
  "metadata": {}
 
6851
  "output_type": "display_data",
6852
  "data": {
6853
  "text/plain": [
6854
+ "merges.txt: 0.00B [00:00, ?B/s]"
6855
  ],
6856
  "application/vnd.jupyter.widget-view+json": {
6857
  "version_major": 2,
6858
  "version_minor": 0,
6859
+ "model_id": "8c53093a52d249a4b10e8dad950aef62"
6860
  }
6861
  },
6862
  "metadata": {}
 
6865
  "output_type": "display_data",
6866
  "data": {
6867
  "text/plain": [
6868
+ "generation_config.json: 0%| | 0.00/269 [00:00<?, ?B/s]"
6869
  ],
6870
  "application/vnd.jupyter.widget-view+json": {
6871
  "version_major": 2,
6872
  "version_minor": 0,
6873
+ "model_id": "d2ea7cdbe39f421eac88fd60c07832aa"
6874
  }
6875
  },
6876
  "metadata": {}
 
6879
  "output_type": "display_data",
6880
  "data": {
6881
  "text/plain": [
6882
+ "configuration.json: 0%| | 0.00/73.0 [00:00<?, ?B/s]"
6883
  ],
6884
  "application/vnd.jupyter.widget-view+json": {
6885
  "version_major": 2,
6886
  "version_minor": 0,
6887
+ "model_id": "0517d3ca8f754dda9c05c58df468f389"
6888
  }
6889
  },
6890
  "metadata": {}
 
6893
  "output_type": "display_data",
6894
  "data": {
6895
  "text/plain": [
6896
+ "tokenizer.json: 0.00B [00:00, ?B/s]"
6897
  ],
6898
  "application/vnd.jupyter.widget-view+json": {
6899
  "version_major": 2,
6900
  "version_minor": 0,
6901
+ "model_id": "b4dbd23ca854403b98b3550f10672c3d"
6902
  }
6903
  },
6904
  "metadata": {}
 
6907
  "output_type": "display_data",
6908
  "data": {
6909
  "text/plain": [
6910
+ "tokenizer_config.json: 0.00B [00:00, ?B/s]"
6911
  ],
6912
  "application/vnd.jupyter.widget-view+json": {
6913
  "version_major": 2,
6914
  "version_minor": 0,
6915
+ "model_id": "067b7146c43d409d8279ba5f1add3d37"
6916
  }
6917
  },
6918
  "metadata": {}
 
6921
  "output_type": "display_data",
6922
  "data": {
6923
  "text/plain": [
6924
+ "vocab.json: 0.00B [00:00, ?B/s]"
6925
  ],
6926
  "application/vnd.jupyter.widget-view+json": {
6927
  "version_major": 2,
6928
  "version_minor": 0,
6929
+ "model_id": "96eab2db9f1c47e3be7f05e17dd4bc2e"
6930
  }
6931
  },
6932
  "metadata": {}
6933
  },
6934
+ {
6935
+ "output_type": "stream",
6936
+ "name": "stdout",
6937
+ "text": [
6938
+ "✅ SDNQ model downloaded.\n",
6939
+ "Loading processor for SDNQ model...\n"
6940
+ ]
6941
+ },
6942
+ {
6943
+ "output_type": "stream",
6944
+ "name": "stderr",
6945
+ "text": [
6946
+ "`torch_dtype` is deprecated! Use `dtype` instead!\n",
6947
+ "Unknown quantization type, got sdnq - supported types are: ['awq', 'bitsandbytes_4bit', 'bitsandbytes_8bit', 'gptq', 'aqlm', 'quanto', 'quark', 'fp_quant', 'eetq', 'higgs', 'hqq', 'compressed-tensors', 'fbgemm_fp8', 'torchao', 'bitnet', 'vptq', 'spqr', 'fp8', 'auto-round', 'mxfp4']. Hence, we will skip the quantization. To remove the warning, you can delete the quantization_config attribute in config.json\n"
6948
+ ]
6949
+ },
6950
+ {
6951
+ "output_type": "stream",
6952
+ "name": "stdout",
6953
+ "text": [
6954
+ "Loading SDNQ model...\n"
6955
+ ]
6956
+ },
6957
  {
6958
  "output_type": "display_data",
6959
  "data": {
6960
  "text/plain": [
6961
+ "Loading checkpoint shards: 0%| | 0/3 [00:00<?, ?it/s]"
6962
  ],
6963
  "application/vnd.jupyter.widget-view+json": {
6964
  "version_major": 2,
6965
  "version_minor": 0,
6966
+ "model_id": "87e5466584114b6daf247e76b485e20b"
6967
  }
6968
  },
6969
  "metadata": {}
6970
+ },
6971
+ {
6972
+ "output_type": "error",
6973
+ "ename": "RuntimeError",
6974
+ "evalue": "Error(s) in loading state_dict for Linear:\n\tsize mismatch for weight: copying a param with shape torch.Size([6291456, 5]) from checkpoint, the shape in current model is torch.Size([4096, 12288]).",
6975
+ "traceback": [
6976
+ "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
6977
+ "\u001b[0;31mRuntimeError\u001b[0m Traceback (most recent call last)",
6978
+ "\u001b[0;32m/tmp/ipykernel_3788/3308593350.py\u001b[0m in \u001b[0;36m<cell line: 0>\u001b[0;34m()\u001b[0m\n\u001b[1;32m 21\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 22\u001b[0m \u001b[0mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"Loading SDNQ model...\"\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 23\u001b[0;31m sdnq_model = Qwen3VLForConditionalGeneration.from_pretrained(\n\u001b[0m\u001b[1;32m 24\u001b[0m \u001b[0msdnq_local_download_path\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 25\u001b[0m \u001b[0mtorch_dtype\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mtorch\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfloat32\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;31m# Ensure correct dtype if needed\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
6979
+ "\u001b[0;32m/usr/local/lib/python3.12/dist-packages/transformers/modeling_utils.py\u001b[0m in \u001b[0;36m_wrapper\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 275\u001b[0m \u001b[0mold_dtype\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtorch\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mget_default_dtype\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 276\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 277\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 278\u001b[0m \u001b[0;32mfinally\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 279\u001b[0m \u001b[0mtorch\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mset_default_dtype\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mold_dtype\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
6980
+ "\u001b[0;32m/usr/local/lib/python3.12/dist-packages/transformers/modeling_utils.py\u001b[0m in \u001b[0;36mfrom_pretrained\u001b[0;34m(cls, pretrained_model_name_or_path, config, cache_dir, ignore_mismatched_sizes, force_download, local_files_only, token, revision, use_safetensors, weights_only, *model_args, **kwargs)\u001b[0m\n\u001b[1;32m 5046\u001b[0m \u001b[0moffload_index\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 5047\u001b[0m \u001b[0merror_msgs\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 5048\u001b[0;31m \u001b[0;34m)\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mcls\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_load_pretrained_model\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 5049\u001b[0m \u001b[0mmodel\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 5050\u001b[0m \u001b[0mstate_dict\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
6981
+ "\u001b[0;32m/usr/local/lib/python3.12/dist-packages/transformers/modeling_utils.py\u001b[0m in \u001b[0;36m_load_pretrained_model\u001b[0;34m(cls, model, state_dict, checkpoint_files, pretrained_model_name_or_path, ignore_mismatched_sizes, sharded_metadata, device_map, disk_offload_folder, dtype, hf_quantizer, keep_in_fp32_regex, device_mesh, key_mapping, weights_only)\u001b[0m\n\u001b[1;32m 5466\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 5467\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0margs\u001b[0m \u001b[0;32min\u001b[0m \u001b[0margs_list\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 5468\u001b[0;31m \u001b[0m_error_msgs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdisk_offload_index\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mload_shard_file\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 5469\u001b[0m \u001b[0merror_msgs\u001b[0m \u001b[0;34m+=\u001b[0m \u001b[0m_error_msgs\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 5470\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
6982
+ "\u001b[0;32m/usr/local/lib/python3.12/dist-packages/transformers/modeling_utils.py\u001b[0m in \u001b[0;36mload_shard_file\u001b[0;34m(args)\u001b[0m\n\u001b[1;32m 841\u001b[0m \u001b[0;31m# Skip it with fsdp on ranks other than 0\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 842\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0mis_fsdp_enabled\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mis_local_dist_rank_0\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mis_quantized\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 843\u001b[0;31m disk_offload_index = _load_state_dict_into_meta_model(\n\u001b[0m\u001b[1;32m 844\u001b[0m \u001b[0mmodel\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 845\u001b[0m \u001b[0mstate_dict\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
6983
+ "\u001b[0;32m/usr/local/lib/python3.12/dist-packages/torch/utils/_contextlib.py\u001b[0m in \u001b[0;36mdecorate_context\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 122\u001b[0m \u001b[0;31m# pyrefly: ignore [bad-context-manager]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 123\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mctx_factory\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 124\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 125\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 126\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mdecorate_context\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
6984
+ "\u001b[0;32m/usr/local/lib/python3.12/dist-packages/transformers/modeling_utils.py\u001b[0m in \u001b[0;36m_load_state_dict_into_meta_model\u001b[0;34m(model, state_dict, shard_file, reverse_renaming_mapping, device_map, disk_offload_folder, disk_offload_index, hf_quantizer, keep_in_fp32_regex, device_mesh)\u001b[0m\n\u001b[1;32m 768\u001b[0m \u001b[0mparam_device\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m\"cpu\"\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mis_local_dist_rank_0\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32melse\u001b[0m \u001b[0;34m\"meta\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 769\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 770\u001b[0;31m \u001b[0m_load_parameter_into_model\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mparam_name\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mparam\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mparam_device\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 771\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 772\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
6985
+ "\u001b[0;32m/usr/local/lib/python3.12/dist-packages/transformers/modeling_utils.py\u001b[0m in \u001b[0;36m_load_parameter_into_model\u001b[0;34m(model, param_name, tensor)\u001b[0m\n\u001b[1;32m 665\u001b[0m \u001b[0mmodule\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mparam_type\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mget_module_from_name\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mparam_name\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 666\u001b[0m \u001b[0;31m# This will check potential shape mismatch if skipped before\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 667\u001b[0;31m \u001b[0mmodule\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mload_state_dict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m{\u001b[0m\u001b[0mparam_type\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mtensor\u001b[0m\u001b[0;34m}\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mstrict\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mFalse\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0massign\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 668\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 669\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
6986
+ "\u001b[0;32m/usr/local/lib/python3.12/dist-packages/torch/nn/modules/module.py\u001b[0m in \u001b[0;36mload_state_dict\u001b[0;34m(self, state_dict, strict, assign)\u001b[0m\n\u001b[1;32m 2633\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 2634\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mlen\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0merror_msgs\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m>\u001b[0m \u001b[0;36m0\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 2635\u001b[0;31m raise RuntimeError(\n\u001b[0m\u001b[1;32m 2636\u001b[0m \"Error(s) in loading state_dict for {}:\\n\\t{}\".format(\n\u001b[1;32m 2637\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m__class__\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m__name__\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m\"\\n\\t\"\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjoin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0merror_msgs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
6987
+ "\u001b[0;31mRuntimeError\u001b[0m: Error(s) in loading state_dict for Linear:\n\tsize mismatch for weight: copying a param with shape torch.Size([6291456, 5]) from checkpoint, the shape in current model is torch.Size([4096, 12288])."
6988
+ ]
6989
  }
6990
  ]
6991
  },