chansung commited on
Commit
ffa8b2a
·
1 Parent(s): 1eb06e4

Upload alpacagpt4-lora-7b.ipynb

Browse files
Files changed (1) hide show
  1. alpacagpt4-lora-7b.ipynb +1523 -0
alpacagpt4-lora-7b.ipynb ADDED
@@ -0,0 +1,1523 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "nbformat": 4,
3
+ "nbformat_minor": 0,
4
+ "metadata": {
5
+ "colab": {
6
+ "provenance": [],
7
+ "machine_shape": "hm"
8
+ },
9
+ "kernelspec": {
10
+ "name": "python3",
11
+ "display_name": "Python 3"
12
+ },
13
+ "language_info": {
14
+ "name": "python"
15
+ },
16
+ "accelerator": "GPU",
17
+ "gpuClass": "standard",
18
+ "widgets": {
19
+ "application/vnd.jupyter.widget-state+json": {
20
+ "f0a180029cfc4c59b80697222ffc804e": {
21
+ "model_module": "@jupyter-widgets/controls",
22
+ "model_name": "HBoxModel",
23
+ "model_module_version": "1.5.0",
24
+ "state": {
25
+ "_dom_classes": [],
26
+ "_model_module": "@jupyter-widgets/controls",
27
+ "_model_module_version": "1.5.0",
28
+ "_model_name": "HBoxModel",
29
+ "_view_count": null,
30
+ "_view_module": "@jupyter-widgets/controls",
31
+ "_view_module_version": "1.5.0",
32
+ "_view_name": "HBoxView",
33
+ "box_style": "",
34
+ "children": [
35
+ "IPY_MODEL_e608b9052a6d4e2491eb3b63dc7c8d03",
36
+ "IPY_MODEL_36c64a38fd804214b83c0b2645f5a5ca",
37
+ "IPY_MODEL_dfd3e291cb1b47938bba1d240c2915ab"
38
+ ],
39
+ "layout": "IPY_MODEL_a991ae67d77b4dd4ae30e6ac0e899be1"
40
+ }
41
+ },
42
+ "e608b9052a6d4e2491eb3b63dc7c8d03": {
43
+ "model_module": "@jupyter-widgets/controls",
44
+ "model_name": "HTMLModel",
45
+ "model_module_version": "1.5.0",
46
+ "state": {
47
+ "_dom_classes": [],
48
+ "_model_module": "@jupyter-widgets/controls",
49
+ "_model_module_version": "1.5.0",
50
+ "_model_name": "HTMLModel",
51
+ "_view_count": null,
52
+ "_view_module": "@jupyter-widgets/controls",
53
+ "_view_module_version": "1.5.0",
54
+ "_view_name": "HTMLView",
55
+ "description": "",
56
+ "description_tooltip": null,
57
+ "layout": "IPY_MODEL_8dfa9dd2f1b14615be5c00949dcbb318",
58
+ "placeholder": "​",
59
+ "style": "IPY_MODEL_8f2b68c72f4e41f98b42365561addef3",
60
+ "value": "Loading checkpoint shards: 100%"
61
+ }
62
+ },
63
+ "36c64a38fd804214b83c0b2645f5a5ca": {
64
+ "model_module": "@jupyter-widgets/controls",
65
+ "model_name": "FloatProgressModel",
66
+ "model_module_version": "1.5.0",
67
+ "state": {
68
+ "_dom_classes": [],
69
+ "_model_module": "@jupyter-widgets/controls",
70
+ "_model_module_version": "1.5.0",
71
+ "_model_name": "FloatProgressModel",
72
+ "_view_count": null,
73
+ "_view_module": "@jupyter-widgets/controls",
74
+ "_view_module_version": "1.5.0",
75
+ "_view_name": "ProgressView",
76
+ "bar_style": "success",
77
+ "description": "",
78
+ "description_tooltip": null,
79
+ "layout": "IPY_MODEL_a5f11527f2eb407ea3c702416d6e8f04",
80
+ "max": 2,
81
+ "min": 0,
82
+ "orientation": "horizontal",
83
+ "style": "IPY_MODEL_47c9e6973fe949f9951fb2d7e725dd43",
84
+ "value": 2
85
+ }
86
+ },
87
+ "dfd3e291cb1b47938bba1d240c2915ab": {
88
+ "model_module": "@jupyter-widgets/controls",
89
+ "model_name": "HTMLModel",
90
+ "model_module_version": "1.5.0",
91
+ "state": {
92
+ "_dom_classes": [],
93
+ "_model_module": "@jupyter-widgets/controls",
94
+ "_model_module_version": "1.5.0",
95
+ "_model_name": "HTMLModel",
96
+ "_view_count": null,
97
+ "_view_module": "@jupyter-widgets/controls",
98
+ "_view_module_version": "1.5.0",
99
+ "_view_name": "HTMLView",
100
+ "description": "",
101
+ "description_tooltip": null,
102
+ "layout": "IPY_MODEL_454bcb8132ba4024ba69f93374525765",
103
+ "placeholder": "​",
104
+ "style": "IPY_MODEL_a4db771090f74fb995c6e78ed0e9b9c8",
105
+ "value": " 2/2 [00:58<00:00, 26.95s/it]"
106
+ }
107
+ },
108
+ "a991ae67d77b4dd4ae30e6ac0e899be1": {
109
+ "model_module": "@jupyter-widgets/base",
110
+ "model_name": "LayoutModel",
111
+ "model_module_version": "1.2.0",
112
+ "state": {
113
+ "_model_module": "@jupyter-widgets/base",
114
+ "_model_module_version": "1.2.0",
115
+ "_model_name": "LayoutModel",
116
+ "_view_count": null,
117
+ "_view_module": "@jupyter-widgets/base",
118
+ "_view_module_version": "1.2.0",
119
+ "_view_name": "LayoutView",
120
+ "align_content": null,
121
+ "align_items": null,
122
+ "align_self": null,
123
+ "border": null,
124
+ "bottom": null,
125
+ "display": null,
126
+ "flex": null,
127
+ "flex_flow": null,
128
+ "grid_area": null,
129
+ "grid_auto_columns": null,
130
+ "grid_auto_flow": null,
131
+ "grid_auto_rows": null,
132
+ "grid_column": null,
133
+ "grid_gap": null,
134
+ "grid_row": null,
135
+ "grid_template_areas": null,
136
+ "grid_template_columns": null,
137
+ "grid_template_rows": null,
138
+ "height": null,
139
+ "justify_content": null,
140
+ "justify_items": null,
141
+ "left": null,
142
+ "margin": null,
143
+ "max_height": null,
144
+ "max_width": null,
145
+ "min_height": null,
146
+ "min_width": null,
147
+ "object_fit": null,
148
+ "object_position": null,
149
+ "order": null,
150
+ "overflow": null,
151
+ "overflow_x": null,
152
+ "overflow_y": null,
153
+ "padding": null,
154
+ "right": null,
155
+ "top": null,
156
+ "visibility": null,
157
+ "width": null
158
+ }
159
+ },
160
+ "8dfa9dd2f1b14615be5c00949dcbb318": {
161
+ "model_module": "@jupyter-widgets/base",
162
+ "model_name": "LayoutModel",
163
+ "model_module_version": "1.2.0",
164
+ "state": {
165
+ "_model_module": "@jupyter-widgets/base",
166
+ "_model_module_version": "1.2.0",
167
+ "_model_name": "LayoutModel",
168
+ "_view_count": null,
169
+ "_view_module": "@jupyter-widgets/base",
170
+ "_view_module_version": "1.2.0",
171
+ "_view_name": "LayoutView",
172
+ "align_content": null,
173
+ "align_items": null,
174
+ "align_self": null,
175
+ "border": null,
176
+ "bottom": null,
177
+ "display": null,
178
+ "flex": null,
179
+ "flex_flow": null,
180
+ "grid_area": null,
181
+ "grid_auto_columns": null,
182
+ "grid_auto_flow": null,
183
+ "grid_auto_rows": null,
184
+ "grid_column": null,
185
+ "grid_gap": null,
186
+ "grid_row": null,
187
+ "grid_template_areas": null,
188
+ "grid_template_columns": null,
189
+ "grid_template_rows": null,
190
+ "height": null,
191
+ "justify_content": null,
192
+ "justify_items": null,
193
+ "left": null,
194
+ "margin": null,
195
+ "max_height": null,
196
+ "max_width": null,
197
+ "min_height": null,
198
+ "min_width": null,
199
+ "object_fit": null,
200
+ "object_position": null,
201
+ "order": null,
202
+ "overflow": null,
203
+ "overflow_x": null,
204
+ "overflow_y": null,
205
+ "padding": null,
206
+ "right": null,
207
+ "top": null,
208
+ "visibility": null,
209
+ "width": null
210
+ }
211
+ },
212
+ "8f2b68c72f4e41f98b42365561addef3": {
213
+ "model_module": "@jupyter-widgets/controls",
214
+ "model_name": "DescriptionStyleModel",
215
+ "model_module_version": "1.5.0",
216
+ "state": {
217
+ "_model_module": "@jupyter-widgets/controls",
218
+ "_model_module_version": "1.5.0",
219
+ "_model_name": "DescriptionStyleModel",
220
+ "_view_count": null,
221
+ "_view_module": "@jupyter-widgets/base",
222
+ "_view_module_version": "1.2.0",
223
+ "_view_name": "StyleView",
224
+ "description_width": ""
225
+ }
226
+ },
227
+ "a5f11527f2eb407ea3c702416d6e8f04": {
228
+ "model_module": "@jupyter-widgets/base",
229
+ "model_name": "LayoutModel",
230
+ "model_module_version": "1.2.0",
231
+ "state": {
232
+ "_model_module": "@jupyter-widgets/base",
233
+ "_model_module_version": "1.2.0",
234
+ "_model_name": "LayoutModel",
235
+ "_view_count": null,
236
+ "_view_module": "@jupyter-widgets/base",
237
+ "_view_module_version": "1.2.0",
238
+ "_view_name": "LayoutView",
239
+ "align_content": null,
240
+ "align_items": null,
241
+ "align_self": null,
242
+ "border": null,
243
+ "bottom": null,
244
+ "display": null,
245
+ "flex": null,
246
+ "flex_flow": null,
247
+ "grid_area": null,
248
+ "grid_auto_columns": null,
249
+ "grid_auto_flow": null,
250
+ "grid_auto_rows": null,
251
+ "grid_column": null,
252
+ "grid_gap": null,
253
+ "grid_row": null,
254
+ "grid_template_areas": null,
255
+ "grid_template_columns": null,
256
+ "grid_template_rows": null,
257
+ "height": null,
258
+ "justify_content": null,
259
+ "justify_items": null,
260
+ "left": null,
261
+ "margin": null,
262
+ "max_height": null,
263
+ "max_width": null,
264
+ "min_height": null,
265
+ "min_width": null,
266
+ "object_fit": null,
267
+ "object_position": null,
268
+ "order": null,
269
+ "overflow": null,
270
+ "overflow_x": null,
271
+ "overflow_y": null,
272
+ "padding": null,
273
+ "right": null,
274
+ "top": null,
275
+ "visibility": null,
276
+ "width": null
277
+ }
278
+ },
279
+ "47c9e6973fe949f9951fb2d7e725dd43": {
280
+ "model_module": "@jupyter-widgets/controls",
281
+ "model_name": "ProgressStyleModel",
282
+ "model_module_version": "1.5.0",
283
+ "state": {
284
+ "_model_module": "@jupyter-widgets/controls",
285
+ "_model_module_version": "1.5.0",
286
+ "_model_name": "ProgressStyleModel",
287
+ "_view_count": null,
288
+ "_view_module": "@jupyter-widgets/base",
289
+ "_view_module_version": "1.2.0",
290
+ "_view_name": "StyleView",
291
+ "bar_color": null,
292
+ "description_width": ""
293
+ }
294
+ },
295
+ "454bcb8132ba4024ba69f93374525765": {
296
+ "model_module": "@jupyter-widgets/base",
297
+ "model_name": "LayoutModel",
298
+ "model_module_version": "1.2.0",
299
+ "state": {
300
+ "_model_module": "@jupyter-widgets/base",
301
+ "_model_module_version": "1.2.0",
302
+ "_model_name": "LayoutModel",
303
+ "_view_count": null,
304
+ "_view_module": "@jupyter-widgets/base",
305
+ "_view_module_version": "1.2.0",
306
+ "_view_name": "LayoutView",
307
+ "align_content": null,
308
+ "align_items": null,
309
+ "align_self": null,
310
+ "border": null,
311
+ "bottom": null,
312
+ "display": null,
313
+ "flex": null,
314
+ "flex_flow": null,
315
+ "grid_area": null,
316
+ "grid_auto_columns": null,
317
+ "grid_auto_flow": null,
318
+ "grid_auto_rows": null,
319
+ "grid_column": null,
320
+ "grid_gap": null,
321
+ "grid_row": null,
322
+ "grid_template_areas": null,
323
+ "grid_template_columns": null,
324
+ "grid_template_rows": null,
325
+ "height": null,
326
+ "justify_content": null,
327
+ "justify_items": null,
328
+ "left": null,
329
+ "margin": null,
330
+ "max_height": null,
331
+ "max_width": null,
332
+ "min_height": null,
333
+ "min_width": null,
334
+ "object_fit": null,
335
+ "object_position": null,
336
+ "order": null,
337
+ "overflow": null,
338
+ "overflow_x": null,
339
+ "overflow_y": null,
340
+ "padding": null,
341
+ "right": null,
342
+ "top": null,
343
+ "visibility": null,
344
+ "width": null
345
+ }
346
+ },
347
+ "a4db771090f74fb995c6e78ed0e9b9c8": {
348
+ "model_module": "@jupyter-widgets/controls",
349
+ "model_name": "DescriptionStyleModel",
350
+ "model_module_version": "1.5.0",
351
+ "state": {
352
+ "_model_module": "@jupyter-widgets/controls",
353
+ "_model_module_version": "1.5.0",
354
+ "_model_name": "DescriptionStyleModel",
355
+ "_view_count": null,
356
+ "_view_module": "@jupyter-widgets/base",
357
+ "_view_module_version": "1.2.0",
358
+ "_view_name": "StyleView",
359
+ "description_width": ""
360
+ }
361
+ },
362
+ "59acc2626bc74cc599d884f71fd75cba": {
363
+ "model_module": "@jupyter-widgets/controls",
364
+ "model_name": "HBoxModel",
365
+ "model_module_version": "1.5.0",
366
+ "state": {
367
+ "_dom_classes": [],
368
+ "_model_module": "@jupyter-widgets/controls",
369
+ "_model_module_version": "1.5.0",
370
+ "_model_name": "HBoxModel",
371
+ "_view_count": null,
372
+ "_view_module": "@jupyter-widgets/controls",
373
+ "_view_module_version": "1.5.0",
374
+ "_view_name": "HBoxView",
375
+ "box_style": "",
376
+ "children": [
377
+ "IPY_MODEL_1db26de9b6b64c5b8de26568ccb901a7",
378
+ "IPY_MODEL_56236cd346d84fd6b2e7fa3f1eb2558e",
379
+ "IPY_MODEL_6f2a85b3bc0247e19ad895cc978c6b49"
380
+ ],
381
+ "layout": "IPY_MODEL_257f85824ba34de9baf7ee043100ffa2"
382
+ }
383
+ },
384
+ "1db26de9b6b64c5b8de26568ccb901a7": {
385
+ "model_module": "@jupyter-widgets/controls",
386
+ "model_name": "HTMLModel",
387
+ "model_module_version": "1.5.0",
388
+ "state": {
389
+ "_dom_classes": [],
390
+ "_model_module": "@jupyter-widgets/controls",
391
+ "_model_module_version": "1.5.0",
392
+ "_model_name": "HTMLModel",
393
+ "_view_count": null,
394
+ "_view_module": "@jupyter-widgets/controls",
395
+ "_view_module_version": "1.5.0",
396
+ "_view_name": "HTMLView",
397
+ "description": "",
398
+ "description_tooltip": null,
399
+ "layout": "IPY_MODEL_8372b038ce5b476594208492c5af3d9a",
400
+ "placeholder": "​",
401
+ "style": "IPY_MODEL_3e80894f5c124f39b3c2324938297e72",
402
+ "value": "Downloading (…)/adapter_config.json: 100%"
403
+ }
404
+ },
405
+ "56236cd346d84fd6b2e7fa3f1eb2558e": {
406
+ "model_module": "@jupyter-widgets/controls",
407
+ "model_name": "FloatProgressModel",
408
+ "model_module_version": "1.5.0",
409
+ "state": {
410
+ "_dom_classes": [],
411
+ "_model_module": "@jupyter-widgets/controls",
412
+ "_model_module_version": "1.5.0",
413
+ "_model_name": "FloatProgressModel",
414
+ "_view_count": null,
415
+ "_view_module": "@jupyter-widgets/controls",
416
+ "_view_module_version": "1.5.0",
417
+ "_view_name": "ProgressView",
418
+ "bar_style": "success",
419
+ "description": "",
420
+ "description_tooltip": null,
421
+ "layout": "IPY_MODEL_eb8bc82794d14a21b06da73b9f0bc7b8",
422
+ "max": 435,
423
+ "min": 0,
424
+ "orientation": "horizontal",
425
+ "style": "IPY_MODEL_adcdf199f76e428992df54bf4c168109",
426
+ "value": 435
427
+ }
428
+ },
429
+ "6f2a85b3bc0247e19ad895cc978c6b49": {
430
+ "model_module": "@jupyter-widgets/controls",
431
+ "model_name": "HTMLModel",
432
+ "model_module_version": "1.5.0",
433
+ "state": {
434
+ "_dom_classes": [],
435
+ "_model_module": "@jupyter-widgets/controls",
436
+ "_model_module_version": "1.5.0",
437
+ "_model_name": "HTMLModel",
438
+ "_view_count": null,
439
+ "_view_module": "@jupyter-widgets/controls",
440
+ "_view_module_version": "1.5.0",
441
+ "_view_name": "HTMLView",
442
+ "description": "",
443
+ "description_tooltip": null,
444
+ "layout": "IPY_MODEL_0528160bc14d4a209915bda765f17aad",
445
+ "placeholder": "​",
446
+ "style": "IPY_MODEL_410807c07bee4496af3b837d19c65c5d",
447
+ "value": " 435/435 [00:00<00:00, 36.0kB/s]"
448
+ }
449
+ },
450
+ "257f85824ba34de9baf7ee043100ffa2": {
451
+ "model_module": "@jupyter-widgets/base",
452
+ "model_name": "LayoutModel",
453
+ "model_module_version": "1.2.0",
454
+ "state": {
455
+ "_model_module": "@jupyter-widgets/base",
456
+ "_model_module_version": "1.2.0",
457
+ "_model_name": "LayoutModel",
458
+ "_view_count": null,
459
+ "_view_module": "@jupyter-widgets/base",
460
+ "_view_module_version": "1.2.0",
461
+ "_view_name": "LayoutView",
462
+ "align_content": null,
463
+ "align_items": null,
464
+ "align_self": null,
465
+ "border": null,
466
+ "bottom": null,
467
+ "display": null,
468
+ "flex": null,
469
+ "flex_flow": null,
470
+ "grid_area": null,
471
+ "grid_auto_columns": null,
472
+ "grid_auto_flow": null,
473
+ "grid_auto_rows": null,
474
+ "grid_column": null,
475
+ "grid_gap": null,
476
+ "grid_row": null,
477
+ "grid_template_areas": null,
478
+ "grid_template_columns": null,
479
+ "grid_template_rows": null,
480
+ "height": null,
481
+ "justify_content": null,
482
+ "justify_items": null,
483
+ "left": null,
484
+ "margin": null,
485
+ "max_height": null,
486
+ "max_width": null,
487
+ "min_height": null,
488
+ "min_width": null,
489
+ "object_fit": null,
490
+ "object_position": null,
491
+ "order": null,
492
+ "overflow": null,
493
+ "overflow_x": null,
494
+ "overflow_y": null,
495
+ "padding": null,
496
+ "right": null,
497
+ "top": null,
498
+ "visibility": null,
499
+ "width": null
500
+ }
501
+ },
502
+ "8372b038ce5b476594208492c5af3d9a": {
503
+ "model_module": "@jupyter-widgets/base",
504
+ "model_name": "LayoutModel",
505
+ "model_module_version": "1.2.0",
506
+ "state": {
507
+ "_model_module": "@jupyter-widgets/base",
508
+ "_model_module_version": "1.2.0",
509
+ "_model_name": "LayoutModel",
510
+ "_view_count": null,
511
+ "_view_module": "@jupyter-widgets/base",
512
+ "_view_module_version": "1.2.0",
513
+ "_view_name": "LayoutView",
514
+ "align_content": null,
515
+ "align_items": null,
516
+ "align_self": null,
517
+ "border": null,
518
+ "bottom": null,
519
+ "display": null,
520
+ "flex": null,
521
+ "flex_flow": null,
522
+ "grid_area": null,
523
+ "grid_auto_columns": null,
524
+ "grid_auto_flow": null,
525
+ "grid_auto_rows": null,
526
+ "grid_column": null,
527
+ "grid_gap": null,
528
+ "grid_row": null,
529
+ "grid_template_areas": null,
530
+ "grid_template_columns": null,
531
+ "grid_template_rows": null,
532
+ "height": null,
533
+ "justify_content": null,
534
+ "justify_items": null,
535
+ "left": null,
536
+ "margin": null,
537
+ "max_height": null,
538
+ "max_width": null,
539
+ "min_height": null,
540
+ "min_width": null,
541
+ "object_fit": null,
542
+ "object_position": null,
543
+ "order": null,
544
+ "overflow": null,
545
+ "overflow_x": null,
546
+ "overflow_y": null,
547
+ "padding": null,
548
+ "right": null,
549
+ "top": null,
550
+ "visibility": null,
551
+ "width": null
552
+ }
553
+ },
554
+ "3e80894f5c124f39b3c2324938297e72": {
555
+ "model_module": "@jupyter-widgets/controls",
556
+ "model_name": "DescriptionStyleModel",
557
+ "model_module_version": "1.5.0",
558
+ "state": {
559
+ "_model_module": "@jupyter-widgets/controls",
560
+ "_model_module_version": "1.5.0",
561
+ "_model_name": "DescriptionStyleModel",
562
+ "_view_count": null,
563
+ "_view_module": "@jupyter-widgets/base",
564
+ "_view_module_version": "1.2.0",
565
+ "_view_name": "StyleView",
566
+ "description_width": ""
567
+ }
568
+ },
569
+ "eb8bc82794d14a21b06da73b9f0bc7b8": {
570
+ "model_module": "@jupyter-widgets/base",
571
+ "model_name": "LayoutModel",
572
+ "model_module_version": "1.2.0",
573
+ "state": {
574
+ "_model_module": "@jupyter-widgets/base",
575
+ "_model_module_version": "1.2.0",
576
+ "_model_name": "LayoutModel",
577
+ "_view_count": null,
578
+ "_view_module": "@jupyter-widgets/base",
579
+ "_view_module_version": "1.2.0",
580
+ "_view_name": "LayoutView",
581
+ "align_content": null,
582
+ "align_items": null,
583
+ "align_self": null,
584
+ "border": null,
585
+ "bottom": null,
586
+ "display": null,
587
+ "flex": null,
588
+ "flex_flow": null,
589
+ "grid_area": null,
590
+ "grid_auto_columns": null,
591
+ "grid_auto_flow": null,
592
+ "grid_auto_rows": null,
593
+ "grid_column": null,
594
+ "grid_gap": null,
595
+ "grid_row": null,
596
+ "grid_template_areas": null,
597
+ "grid_template_columns": null,
598
+ "grid_template_rows": null,
599
+ "height": null,
600
+ "justify_content": null,
601
+ "justify_items": null,
602
+ "left": null,
603
+ "margin": null,
604
+ "max_height": null,
605
+ "max_width": null,
606
+ "min_height": null,
607
+ "min_width": null,
608
+ "object_fit": null,
609
+ "object_position": null,
610
+ "order": null,
611
+ "overflow": null,
612
+ "overflow_x": null,
613
+ "overflow_y": null,
614
+ "padding": null,
615
+ "right": null,
616
+ "top": null,
617
+ "visibility": null,
618
+ "width": null
619
+ }
620
+ },
621
+ "adcdf199f76e428992df54bf4c168109": {
622
+ "model_module": "@jupyter-widgets/controls",
623
+ "model_name": "ProgressStyleModel",
624
+ "model_module_version": "1.5.0",
625
+ "state": {
626
+ "_model_module": "@jupyter-widgets/controls",
627
+ "_model_module_version": "1.5.0",
628
+ "_model_name": "ProgressStyleModel",
629
+ "_view_count": null,
630
+ "_view_module": "@jupyter-widgets/base",
631
+ "_view_module_version": "1.2.0",
632
+ "_view_name": "StyleView",
633
+ "bar_color": null,
634
+ "description_width": ""
635
+ }
636
+ },
637
+ "0528160bc14d4a209915bda765f17aad": {
638
+ "model_module": "@jupyter-widgets/base",
639
+ "model_name": "LayoutModel",
640
+ "model_module_version": "1.2.0",
641
+ "state": {
642
+ "_model_module": "@jupyter-widgets/base",
643
+ "_model_module_version": "1.2.0",
644
+ "_model_name": "LayoutModel",
645
+ "_view_count": null,
646
+ "_view_module": "@jupyter-widgets/base",
647
+ "_view_module_version": "1.2.0",
648
+ "_view_name": "LayoutView",
649
+ "align_content": null,
650
+ "align_items": null,
651
+ "align_self": null,
652
+ "border": null,
653
+ "bottom": null,
654
+ "display": null,
655
+ "flex": null,
656
+ "flex_flow": null,
657
+ "grid_area": null,
658
+ "grid_auto_columns": null,
659
+ "grid_auto_flow": null,
660
+ "grid_auto_rows": null,
661
+ "grid_column": null,
662
+ "grid_gap": null,
663
+ "grid_row": null,
664
+ "grid_template_areas": null,
665
+ "grid_template_columns": null,
666
+ "grid_template_rows": null,
667
+ "height": null,
668
+ "justify_content": null,
669
+ "justify_items": null,
670
+ "left": null,
671
+ "margin": null,
672
+ "max_height": null,
673
+ "max_width": null,
674
+ "min_height": null,
675
+ "min_width": null,
676
+ "object_fit": null,
677
+ "object_position": null,
678
+ "order": null,
679
+ "overflow": null,
680
+ "overflow_x": null,
681
+ "overflow_y": null,
682
+ "padding": null,
683
+ "right": null,
684
+ "top": null,
685
+ "visibility": null,
686
+ "width": null
687
+ }
688
+ },
689
+ "410807c07bee4496af3b837d19c65c5d": {
690
+ "model_module": "@jupyter-widgets/controls",
691
+ "model_name": "DescriptionStyleModel",
692
+ "model_module_version": "1.5.0",
693
+ "state": {
694
+ "_model_module": "@jupyter-widgets/controls",
695
+ "_model_module_version": "1.5.0",
696
+ "_model_name": "DescriptionStyleModel",
697
+ "_view_count": null,
698
+ "_view_module": "@jupyter-widgets/base",
699
+ "_view_module_version": "1.2.0",
700
+ "_view_name": "StyleView",
701
+ "description_width": ""
702
+ }
703
+ },
704
+ "352882e23bcf487f81b002ab676dac0a": {
705
+ "model_module": "@jupyter-widgets/controls",
706
+ "model_name": "HBoxModel",
707
+ "model_module_version": "1.5.0",
708
+ "state": {
709
+ "_dom_classes": [],
710
+ "_model_module": "@jupyter-widgets/controls",
711
+ "_model_module_version": "1.5.0",
712
+ "_model_name": "HBoxModel",
713
+ "_view_count": null,
714
+ "_view_module": "@jupyter-widgets/controls",
715
+ "_view_module_version": "1.5.0",
716
+ "_view_name": "HBoxView",
717
+ "box_style": "",
718
+ "children": [
719
+ "IPY_MODEL_5abcd19a14104376be50cef9a019cb74",
720
+ "IPY_MODEL_1b3bf0704b464b7f8574d74fd63073ae",
721
+ "IPY_MODEL_82cda2a3ece54182ba7e0ebeaf3fee55"
722
+ ],
723
+ "layout": "IPY_MODEL_4435738d377d4a9da21897f689de9cf2"
724
+ }
725
+ },
726
+ "5abcd19a14104376be50cef9a019cb74": {
727
+ "model_module": "@jupyter-widgets/controls",
728
+ "model_name": "HTMLModel",
729
+ "model_module_version": "1.5.0",
730
+ "state": {
731
+ "_dom_classes": [],
732
+ "_model_module": "@jupyter-widgets/controls",
733
+ "_model_module_version": "1.5.0",
734
+ "_model_name": "HTMLModel",
735
+ "_view_count": null,
736
+ "_view_module": "@jupyter-widgets/controls",
737
+ "_view_module_version": "1.5.0",
738
+ "_view_name": "HTMLView",
739
+ "description": "",
740
+ "description_tooltip": null,
741
+ "layout": "IPY_MODEL_517cab5a4e054ded828890c3ef8f0ef3",
742
+ "placeholder": "​",
743
+ "style": "IPY_MODEL_2244c231788845e585e844223815ac89",
744
+ "value": "Downloading adapter_model.bin: 100%"
745
+ }
746
+ },
747
+ "1b3bf0704b464b7f8574d74fd63073ae": {
748
+ "model_module": "@jupyter-widgets/controls",
749
+ "model_name": "FloatProgressModel",
750
+ "model_module_version": "1.5.0",
751
+ "state": {
752
+ "_dom_classes": [],
753
+ "_model_module": "@jupyter-widgets/controls",
754
+ "_model_module_version": "1.5.0",
755
+ "_model_name": "FloatProgressModel",
756
+ "_view_count": null,
757
+ "_view_module": "@jupyter-widgets/controls",
758
+ "_view_module_version": "1.5.0",
759
+ "_view_name": "ProgressView",
760
+ "bar_style": "success",
761
+ "description": "",
762
+ "description_tooltip": null,
763
+ "layout": "IPY_MODEL_7c8a4dd1ac8844759e294a4fbb4105e3",
764
+ "max": 67201357,
765
+ "min": 0,
766
+ "orientation": "horizontal",
767
+ "style": "IPY_MODEL_782fb1d51292417293e656a3adfa5e7c",
768
+ "value": 67201357
769
+ }
770
+ },
771
+ "82cda2a3ece54182ba7e0ebeaf3fee55": {
772
+ "model_module": "@jupyter-widgets/controls",
773
+ "model_name": "HTMLModel",
774
+ "model_module_version": "1.5.0",
775
+ "state": {
776
+ "_dom_classes": [],
777
+ "_model_module": "@jupyter-widgets/controls",
778
+ "_model_module_version": "1.5.0",
779
+ "_model_name": "HTMLModel",
780
+ "_view_count": null,
781
+ "_view_module": "@jupyter-widgets/controls",
782
+ "_view_module_version": "1.5.0",
783
+ "_view_name": "HTMLView",
784
+ "description": "",
785
+ "description_tooltip": null,
786
+ "layout": "IPY_MODEL_c88603c1ffc94d23851357c1603ad087",
787
+ "placeholder": "​",
788
+ "style": "IPY_MODEL_d6ca77ebe0c8430ca868f5adda909243",
789
+ "value": " 67.2M/67.2M [00:05<00:00, 15.1MB/s]"
790
+ }
791
+ },
792
+ "4435738d377d4a9da21897f689de9cf2": {
793
+ "model_module": "@jupyter-widgets/base",
794
+ "model_name": "LayoutModel",
795
+ "model_module_version": "1.2.0",
796
+ "state": {
797
+ "_model_module": "@jupyter-widgets/base",
798
+ "_model_module_version": "1.2.0",
799
+ "_model_name": "LayoutModel",
800
+ "_view_count": null,
801
+ "_view_module": "@jupyter-widgets/base",
802
+ "_view_module_version": "1.2.0",
803
+ "_view_name": "LayoutView",
804
+ "align_content": null,
805
+ "align_items": null,
806
+ "align_self": null,
807
+ "border": null,
808
+ "bottom": null,
809
+ "display": null,
810
+ "flex": null,
811
+ "flex_flow": null,
812
+ "grid_area": null,
813
+ "grid_auto_columns": null,
814
+ "grid_auto_flow": null,
815
+ "grid_auto_rows": null,
816
+ "grid_column": null,
817
+ "grid_gap": null,
818
+ "grid_row": null,
819
+ "grid_template_areas": null,
820
+ "grid_template_columns": null,
821
+ "grid_template_rows": null,
822
+ "height": null,
823
+ "justify_content": null,
824
+ "justify_items": null,
825
+ "left": null,
826
+ "margin": null,
827
+ "max_height": null,
828
+ "max_width": null,
829
+ "min_height": null,
830
+ "min_width": null,
831
+ "object_fit": null,
832
+ "object_position": null,
833
+ "order": null,
834
+ "overflow": null,
835
+ "overflow_x": null,
836
+ "overflow_y": null,
837
+ "padding": null,
838
+ "right": null,
839
+ "top": null,
840
+ "visibility": null,
841
+ "width": null
842
+ }
843
+ },
844
+ "517cab5a4e054ded828890c3ef8f0ef3": {
845
+ "model_module": "@jupyter-widgets/base",
846
+ "model_name": "LayoutModel",
847
+ "model_module_version": "1.2.0",
848
+ "state": {
849
+ "_model_module": "@jupyter-widgets/base",
850
+ "_model_module_version": "1.2.0",
851
+ "_model_name": "LayoutModel",
852
+ "_view_count": null,
853
+ "_view_module": "@jupyter-widgets/base",
854
+ "_view_module_version": "1.2.0",
855
+ "_view_name": "LayoutView",
856
+ "align_content": null,
857
+ "align_items": null,
858
+ "align_self": null,
859
+ "border": null,
860
+ "bottom": null,
861
+ "display": null,
862
+ "flex": null,
863
+ "flex_flow": null,
864
+ "grid_area": null,
865
+ "grid_auto_columns": null,
866
+ "grid_auto_flow": null,
867
+ "grid_auto_rows": null,
868
+ "grid_column": null,
869
+ "grid_gap": null,
870
+ "grid_row": null,
871
+ "grid_template_areas": null,
872
+ "grid_template_columns": null,
873
+ "grid_template_rows": null,
874
+ "height": null,
875
+ "justify_content": null,
876
+ "justify_items": null,
877
+ "left": null,
878
+ "margin": null,
879
+ "max_height": null,
880
+ "max_width": null,
881
+ "min_height": null,
882
+ "min_width": null,
883
+ "object_fit": null,
884
+ "object_position": null,
885
+ "order": null,
886
+ "overflow": null,
887
+ "overflow_x": null,
888
+ "overflow_y": null,
889
+ "padding": null,
890
+ "right": null,
891
+ "top": null,
892
+ "visibility": null,
893
+ "width": null
894
+ }
895
+ },
896
+ "2244c231788845e585e844223815ac89": {
897
+ "model_module": "@jupyter-widgets/controls",
898
+ "model_name": "DescriptionStyleModel",
899
+ "model_module_version": "1.5.0",
900
+ "state": {
901
+ "_model_module": "@jupyter-widgets/controls",
902
+ "_model_module_version": "1.5.0",
903
+ "_model_name": "DescriptionStyleModel",
904
+ "_view_count": null,
905
+ "_view_module": "@jupyter-widgets/base",
906
+ "_view_module_version": "1.2.0",
907
+ "_view_name": "StyleView",
908
+ "description_width": ""
909
+ }
910
+ },
911
+ "7c8a4dd1ac8844759e294a4fbb4105e3": {
912
+ "model_module": "@jupyter-widgets/base",
913
+ "model_name": "LayoutModel",
914
+ "model_module_version": "1.2.0",
915
+ "state": {
916
+ "_model_module": "@jupyter-widgets/base",
917
+ "_model_module_version": "1.2.0",
918
+ "_model_name": "LayoutModel",
919
+ "_view_count": null,
920
+ "_view_module": "@jupyter-widgets/base",
921
+ "_view_module_version": "1.2.0",
922
+ "_view_name": "LayoutView",
923
+ "align_content": null,
924
+ "align_items": null,
925
+ "align_self": null,
926
+ "border": null,
927
+ "bottom": null,
928
+ "display": null,
929
+ "flex": null,
930
+ "flex_flow": null,
931
+ "grid_area": null,
932
+ "grid_auto_columns": null,
933
+ "grid_auto_flow": null,
934
+ "grid_auto_rows": null,
935
+ "grid_column": null,
936
+ "grid_gap": null,
937
+ "grid_row": null,
938
+ "grid_template_areas": null,
939
+ "grid_template_columns": null,
940
+ "grid_template_rows": null,
941
+ "height": null,
942
+ "justify_content": null,
943
+ "justify_items": null,
944
+ "left": null,
945
+ "margin": null,
946
+ "max_height": null,
947
+ "max_width": null,
948
+ "min_height": null,
949
+ "min_width": null,
950
+ "object_fit": null,
951
+ "object_position": null,
952
+ "order": null,
953
+ "overflow": null,
954
+ "overflow_x": null,
955
+ "overflow_y": null,
956
+ "padding": null,
957
+ "right": null,
958
+ "top": null,
959
+ "visibility": null,
960
+ "width": null
961
+ }
962
+ },
963
+ "782fb1d51292417293e656a3adfa5e7c": {
964
+ "model_module": "@jupyter-widgets/controls",
965
+ "model_name": "ProgressStyleModel",
966
+ "model_module_version": "1.5.0",
967
+ "state": {
968
+ "_model_module": "@jupyter-widgets/controls",
969
+ "_model_module_version": "1.5.0",
970
+ "_model_name": "ProgressStyleModel",
971
+ "_view_count": null,
972
+ "_view_module": "@jupyter-widgets/base",
973
+ "_view_module_version": "1.2.0",
974
+ "_view_name": "StyleView",
975
+ "bar_color": null,
976
+ "description_width": ""
977
+ }
978
+ },
979
+ "c88603c1ffc94d23851357c1603ad087": {
980
+ "model_module": "@jupyter-widgets/base",
981
+ "model_name": "LayoutModel",
982
+ "model_module_version": "1.2.0",
983
+ "state": {
984
+ "_model_module": "@jupyter-widgets/base",
985
+ "_model_module_version": "1.2.0",
986
+ "_model_name": "LayoutModel",
987
+ "_view_count": null,
988
+ "_view_module": "@jupyter-widgets/base",
989
+ "_view_module_version": "1.2.0",
990
+ "_view_name": "LayoutView",
991
+ "align_content": null,
992
+ "align_items": null,
993
+ "align_self": null,
994
+ "border": null,
995
+ "bottom": null,
996
+ "display": null,
997
+ "flex": null,
998
+ "flex_flow": null,
999
+ "grid_area": null,
1000
+ "grid_auto_columns": null,
1001
+ "grid_auto_flow": null,
1002
+ "grid_auto_rows": null,
1003
+ "grid_column": null,
1004
+ "grid_gap": null,
1005
+ "grid_row": null,
1006
+ "grid_template_areas": null,
1007
+ "grid_template_columns": null,
1008
+ "grid_template_rows": null,
1009
+ "height": null,
1010
+ "justify_content": null,
1011
+ "justify_items": null,
1012
+ "left": null,
1013
+ "margin": null,
1014
+ "max_height": null,
1015
+ "max_width": null,
1016
+ "min_height": null,
1017
+ "min_width": null,
1018
+ "object_fit": null,
1019
+ "object_position": null,
1020
+ "order": null,
1021
+ "overflow": null,
1022
+ "overflow_x": null,
1023
+ "overflow_y": null,
1024
+ "padding": null,
1025
+ "right": null,
1026
+ "top": null,
1027
+ "visibility": null,
1028
+ "width": null
1029
+ }
1030
+ },
1031
+ "d6ca77ebe0c8430ca868f5adda909243": {
1032
+ "model_module": "@jupyter-widgets/controls",
1033
+ "model_name": "DescriptionStyleModel",
1034
+ "model_module_version": "1.5.0",
1035
+ "state": {
1036
+ "_model_module": "@jupyter-widgets/controls",
1037
+ "_model_module_version": "1.5.0",
1038
+ "_model_name": "DescriptionStyleModel",
1039
+ "_view_count": null,
1040
+ "_view_module": "@jupyter-widgets/base",
1041
+ "_view_module_version": "1.2.0",
1042
+ "_view_name": "StyleView",
1043
+ "description_width": ""
1044
+ }
1045
+ }
1046
+ }
1047
+ }
1048
+ },
1049
+ "cells": [
1050
+ {
1051
+ "cell_type": "code",
1052
+ "execution_count": null,
1053
+ "metadata": {
1054
+ "id": "EffVs46Xm6kO"
1055
+ },
1056
+ "outputs": [],
1057
+ "source": [
1058
+ "!pip -q install git+https://github.com/huggingface/transformers.git\n",
1059
+ "!pip -q install peft\n",
1060
+ "!pip -q install accelerate\n",
1061
+ "!pip -q install sentencepiece\n",
1062
+ "!pip -q install bitsandbytes"
1063
+ ]
1064
+ },
1065
+ {
1066
+ "cell_type": "code",
1067
+ "source": [
1068
+ "from IPython.display import Markdown as md\n",
1069
+ "\n",
1070
+ "import transformers\n",
1071
+ "import peft\n",
1072
+ "import accelerate\n",
1073
+ "import bitsandbytes\n",
1074
+ "\n",
1075
+ "print(transformers.__version__)\n",
1076
+ "print(peft.__version__)\n",
1077
+ "print(accelerate.__version__)\n"
1078
+ ],
1079
+ "metadata": {
1080
+ "id": "p0WQoR0cm-LA"
1081
+ },
1082
+ "execution_count": null,
1083
+ "outputs": []
1084
+ },
1085
+ {
1086
+ "cell_type": "code",
1087
+ "source": [
1088
+ "import torch\n",
1089
+ "from peft import PeftModel\n",
1090
+ "from transformers import LlamaTokenizer, LlamaForCausalLM\n",
1091
+ "\n",
1092
+ "def load_model(base, finetuned):\n",
1093
+ " tokenizer = LlamaTokenizer.from_pretrained(base)\n",
1094
+ " tokenizer.pad_token_id = 0\n",
1095
+ " tokenizer.padding_side = \"left\"\n",
1096
+ "\n",
1097
+ " model = LlamaForCausalLM.from_pretrained(\n",
1098
+ " base,\n",
1099
+ " load_in_8bit=True,\n",
1100
+ " device_map=\"auto\",\n",
1101
+ " )\n",
1102
+ " \n",
1103
+ " model = PeftModel.from_pretrained(\n",
1104
+ " model, \n",
1105
+ " finetuned,\n",
1106
+ " device_map={'': 0}\n",
1107
+ " )\n",
1108
+ " return model, tokenizer\n",
1109
+ "\n",
1110
+ "def get_output_batch(\n",
1111
+ " model, tokenizer, prompt, generation_config, device='cuda'\n",
1112
+ "):\n",
1113
+ " encoding = tokenizer(prompt, return_tensors=\"pt\")\n",
1114
+ " input_ids = encoding[\"input_ids\"].to(device)\n",
1115
+ " generated_id = model.generate(\n",
1116
+ " input_ids=input_ids,\n",
1117
+ " generation_config=generation_config,\n",
1118
+ " max_new_tokens=256\n",
1119
+ " )\n",
1120
+ "\n",
1121
+ " decoded = tokenizer.batch_decode(\n",
1122
+ " generated_id, skip_special_tokens=True\n",
1123
+ " )\n",
1124
+ " del input_ids, generated_id\n",
1125
+ " torch.cuda.empty_cache()\n",
1126
+ " return decoded[0].split(\"### Response:\")[-1]"
1127
+ ],
1128
+ "metadata": {
1129
+ "id": "fdW1Xhi-nM_G"
1130
+ },
1131
+ "execution_count": 2,
1132
+ "outputs": []
1133
+ },
1134
+ {
1135
+ "cell_type": "markdown",
1136
+ "source": [
1137
+ "### AlpacaGPT4-LoRA 7B (05/01)"
1138
+ ],
1139
+ "metadata": {
1140
+ "id": "mWIAXIlQn87-"
1141
+ }
1142
+ },
1143
+ {
1144
+ "cell_type": "code",
1145
+ "source": [
1146
+ "from transformers import GenerationConfig\n",
1147
+ "\n",
1148
+ "base = \"elinas/llama-7b-hf-transformers-4.29\"\n",
1149
+ "sft = \"LLMs/AlpacaGPT4-LoRA-7B-elina\"\n",
1150
+ "\n",
1151
+ "genConfig = GenerationConfig(\n",
1152
+ " temperature=0.95,\n",
1153
+ " top_p=0.9,\n",
1154
+ " top_k=50,\n",
1155
+ " num_beams=1,\n",
1156
+ " repetition_penalty=1.2,\n",
1157
+ " max_new_tokens=2048,\n",
1158
+ " do_sample=True,\n",
1159
+ ")"
1160
+ ],
1161
+ "metadata": {
1162
+ "id": "_ZzZ5A6wn8p_"
1163
+ },
1164
+ "execution_count": 3,
1165
+ "outputs": []
1166
+ },
1167
+ {
1168
+ "cell_type": "code",
1169
+ "source": [
1170
+ "model, tokenizer = load_model(base, sft)"
1171
+ ],
1172
+ "metadata": {
1173
+ "colab": {
1174
+ "base_uri": "https://localhost:8080/",
1175
+ "height": 151,
1176
+ "referenced_widgets": [
1177
+ "f0a180029cfc4c59b80697222ffc804e",
1178
+ "e608b9052a6d4e2491eb3b63dc7c8d03",
1179
+ "36c64a38fd804214b83c0b2645f5a5ca",
1180
+ "dfd3e291cb1b47938bba1d240c2915ab",
1181
+ "a991ae67d77b4dd4ae30e6ac0e899be1",
1182
+ "8dfa9dd2f1b14615be5c00949dcbb318",
1183
+ "8f2b68c72f4e41f98b42365561addef3",
1184
+ "a5f11527f2eb407ea3c702416d6e8f04",
1185
+ "47c9e6973fe949f9951fb2d7e725dd43",
1186
+ "454bcb8132ba4024ba69f93374525765",
1187
+ "a4db771090f74fb995c6e78ed0e9b9c8",
1188
+ "59acc2626bc74cc599d884f71fd75cba",
1189
+ "1db26de9b6b64c5b8de26568ccb901a7",
1190
+ "56236cd346d84fd6b2e7fa3f1eb2558e",
1191
+ "6f2a85b3bc0247e19ad895cc978c6b49",
1192
+ "257f85824ba34de9baf7ee043100ffa2",
1193
+ "8372b038ce5b476594208492c5af3d9a",
1194
+ "3e80894f5c124f39b3c2324938297e72",
1195
+ "eb8bc82794d14a21b06da73b9f0bc7b8",
1196
+ "adcdf199f76e428992df54bf4c168109",
1197
+ "0528160bc14d4a209915bda765f17aad",
1198
+ "410807c07bee4496af3b837d19c65c5d",
1199
+ "352882e23bcf487f81b002ab676dac0a",
1200
+ "5abcd19a14104376be50cef9a019cb74",
1201
+ "1b3bf0704b464b7f8574d74fd63073ae",
1202
+ "82cda2a3ece54182ba7e0ebeaf3fee55",
1203
+ "4435738d377d4a9da21897f689de9cf2",
1204
+ "517cab5a4e054ded828890c3ef8f0ef3",
1205
+ "2244c231788845e585e844223815ac89",
1206
+ "7c8a4dd1ac8844759e294a4fbb4105e3",
1207
+ "782fb1d51292417293e656a3adfa5e7c",
1208
+ "c88603c1ffc94d23851357c1603ad087",
1209
+ "d6ca77ebe0c8430ca868f5adda909243"
1210
+ ]
1211
+ },
1212
+ "id": "VlMCjqebn4yT",
1213
+ "outputId": "d3c01962-1759-450b-b83c-048e6b3503bc"
1214
+ },
1215
+ "execution_count": 4,
1216
+ "outputs": [
1217
+ {
1218
+ "output_type": "stream",
1219
+ "name": "stderr",
1220
+ "text": [
1221
+ "Overriding torch_dtype=None with `torch_dtype=torch.float16` due to requirements of `bitsandbytes` to enable model loading in mixed int8. Either pass torch_dtype=torch.float16 or don't pass this argument at all to remove this warning.\n"
1222
+ ]
1223
+ },
1224
+ {
1225
+ "output_type": "display_data",
1226
+ "data": {
1227
+ "text/plain": [
1228
+ "Loading checkpoint shards: 0%| | 0/2 [00:00<?, ?it/s]"
1229
+ ],
1230
+ "application/vnd.jupyter.widget-view+json": {
1231
+ "version_major": 2,
1232
+ "version_minor": 0,
1233
+ "model_id": "f0a180029cfc4c59b80697222ffc804e"
1234
+ }
1235
+ },
1236
+ "metadata": {}
1237
+ },
1238
+ {
1239
+ "output_type": "display_data",
1240
+ "data": {
1241
+ "text/plain": [
1242
+ "Downloading (…)/adapter_config.json: 0%| | 0.00/435 [00:00<?, ?B/s]"
1243
+ ],
1244
+ "application/vnd.jupyter.widget-view+json": {
1245
+ "version_major": 2,
1246
+ "version_minor": 0,
1247
+ "model_id": "59acc2626bc74cc599d884f71fd75cba"
1248
+ }
1249
+ },
1250
+ "metadata": {}
1251
+ },
1252
+ {
1253
+ "output_type": "display_data",
1254
+ "data": {
1255
+ "text/plain": [
1256
+ "Downloading adapter_model.bin: 0%| | 0.00/67.2M [00:00<?, ?B/s]"
1257
+ ],
1258
+ "application/vnd.jupyter.widget-view+json": {
1259
+ "version_major": 2,
1260
+ "version_minor": 0,
1261
+ "model_id": "352882e23bcf487f81b002ab676dac0a"
1262
+ }
1263
+ },
1264
+ "metadata": {}
1265
+ }
1266
+ ]
1267
+ },
1268
+ {
1269
+ "cell_type": "code",
1270
+ "source": [
1271
+ "prompt = \"\"\"### Instruction: Compose an engaging travel blog post about a recent trip to Hawaii, highlighting cultural experiences and must-see attractions.\n",
1272
+ "\n",
1273
+ "### Response:\"\"\"\n",
1274
+ "\n",
1275
+ "output = get_output_batch(model, tokenizer, prompt, genConfig)\n",
1276
+ "md(output.replace(\"\\n\", \"<br />\"))"
1277
+ ],
1278
+ "metadata": {
1279
+ "colab": {
1280
+ "base_uri": "https://localhost:8080/",
1281
+ "height": 185
1282
+ },
1283
+ "id": "z3WRDweToO1u",
1284
+ "outputId": "6a35a027-e29e-4290-e7f5-7c0fc8537d87"
1285
+ },
1286
+ "execution_count": 5,
1287
+ "outputs": [
1288
+ {
1289
+ "output_type": "execute_result",
1290
+ "data": {
1291
+ "text/plain": [
1292
+ "<IPython.core.display.Markdown object>"
1293
+ ],
1294
+ "text/markdown": "<br />Dear Travelers, <br />Have you ever wondered what it's like to step foot on one of the most famous islands in the world? Have you dreamt of experiencing its natural beauty and exotic culture? Well, here at Explorify we have just returned from our epic journey to paradise - HAWAII! As experienced tourists and avid explorers ourselves, we had the opportunity to embark upon the adventure of a lifetime and bring back some truly unforgettable memories. Our first stop was Oahu Island where we visited numerous locations such as Diamond Head State Monument, The Pali Lookout & Nu’uanu Valley Overlook for panoramic views over Honolulu, Waikiki Beach, Kualoa Regional Park with lush greenery and picturesque valleys all around us. We took part in many activities including hiking through breathtaking trails, snorkeling and swimming in crystal clear waters surrounded by colorful marine life and fishes while enjoying magnificent underwater scenes. In addition to visiting Pearl Harbor Memorial and witnessing military history up close, we also went deep sea fishing aboard cat"
1295
+ },
1296
+ "metadata": {},
1297
+ "execution_count": 5
1298
+ }
1299
+ ]
1300
+ },
1301
+ {
1302
+ "cell_type": "code",
1303
+ "source": [
1304
+ "prompt = \"\"\"### Instruction: Can you help me write a formal email to a potential business partner proposing a joint venture?\n",
1305
+ "\n",
1306
+ "### Response:\"\"\"\n",
1307
+ "\n",
1308
+ "output = get_output_batch(model, tokenizer, prompt, genConfig)\n",
1309
+ "md(output.replace(\"\\n\", \"<br />\"))"
1310
+ ],
1311
+ "metadata": {
1312
+ "colab": {
1313
+ "base_uri": "https://localhost:8080/",
1314
+ "height": 185
1315
+ },
1316
+ "id": "P0menmcsuK8L",
1317
+ "outputId": "b69751cb-dfd5-46cc-f88a-28ad2c0798b7"
1318
+ },
1319
+ "execution_count": 6,
1320
+ "outputs": [
1321
+ {
1322
+ "output_type": "execute_result",
1323
+ "data": {
1324
+ "text/plain": [
1325
+ "<IPython.core.display.Markdown object>"
1326
+ ],
1327
+ "text/markdown": "<br />Dear [Partner Name], <br /><br />We are excited about the prospect of creating a new partnership with your organization and we hope that this letter serves as an opportunity for us to discuss in detail our proposal. We at Company X have been researching various options available to expand our service offerings, and we believe that a joint venture would be mutually beneficial. As part of the collaboration, both parties will receive a share of profits based on their respective contributions made towards achieving common goals such as increasing market penetration, improving efficiency and reducing costs while maintaining high-quality standards. In addition, each company can leverage its expertise to create value for customers through innovative products or services. Finally, the resulting synergy between our two organizations is expected to deliver long-term benefits."
1328
+ },
1329
+ "metadata": {},
1330
+ "execution_count": 6
1331
+ }
1332
+ ]
1333
+ },
1334
+ {
1335
+ "cell_type": "code",
1336
+ "source": [
1337
+ "prompt = \"\"\"### Instruction: Can you help me write a resignation letter to my current employer, while leaving on good terms and expressing gratitude for the opportunities provided?\n",
1338
+ "\n",
1339
+ "### Response:\"\"\"\n",
1340
+ "\n",
1341
+ "output = get_output_batch(model, tokenizer, prompt, genConfig)\n",
1342
+ "md(output.replace(\"\\n\", \"<br />\"))"
1343
+ ],
1344
+ "metadata": {
1345
+ "colab": {
1346
+ "base_uri": "https://localhost:8080/",
1347
+ "height": 220
1348
+ },
1349
+ "id": "0XmVJacyxHw8",
1350
+ "outputId": "8353bf42-140d-4567-9e1d-954a5500d3a7"
1351
+ },
1352
+ "execution_count": 7,
1353
+ "outputs": [
1354
+ {
1355
+ "output_type": "execute_result",
1356
+ "data": {
1357
+ "text/plain": [
1358
+ "<IPython.core.display.Markdown object>"
1359
+ ],
1360
+ "text/markdown": " Dear [Name of Employer],<br /><br />After much consideration, I regretfully inform you that I will be ending my employment with your company. It has been an honor working alongside all of you during this time, and it is with great sadness that I must move forward from this position. <br /><br />My decision was not made lightly; I have greatly appreciated being given the opportunity to grow professionally as well as personally in this role. You have helped fostered an environment where collaboration and teamwork are valued, and the knowledge that we each bring together creates innovative solutions every day. Thank you for providing me with a supportive workplace, challenges, learning experiences, and personal growth throughout these years. <br /><br />In closing, know that even though I am stepping away, our relationship remains important and valuable to both parties involved. Please accept this letter as both my resignation but also my sincere appreciation and wish for continued success within the organization."
1361
+ },
1362
+ "metadata": {},
1363
+ "execution_count": 7
1364
+ }
1365
+ ]
1366
+ },
1367
+ {
1368
+ "cell_type": "markdown",
1369
+ "source": [],
1370
+ "metadata": {
1371
+ "id": "o20g3usqyVlo"
1372
+ }
1373
+ },
1374
+ {
1375
+ "cell_type": "code",
1376
+ "source": [
1377
+ "prompt = \"\"\"### Instruction: How can you determine if a restaurant is popular among locals or mainly attracts tourists, and why might this information be useful?\n",
1378
+ "\n",
1379
+ "### Response:\"\"\"\n",
1380
+ "\n",
1381
+ "output = get_output_batch(model, tokenizer, prompt, genConfig)\n",
1382
+ "md(output.replace(\"\\n\", \"<br />\"))"
1383
+ ],
1384
+ "metadata": {
1385
+ "colab": {
1386
+ "base_uri": "https://localhost:8080/",
1387
+ "height": 168
1388
+ },
1389
+ "id": "vILBz5Nfx7RW",
1390
+ "outputId": "6437c9ad-be00-43d0-ddb8-18c8462f33e0"
1391
+ },
1392
+ "execution_count": 8,
1393
+ "outputs": [
1394
+ {
1395
+ "output_type": "execute_result",
1396
+ "data": {
1397
+ "text/plain": [
1398
+ "<IPython.core.display.Markdown object>"
1399
+ ],
1400
+ "text/markdown": " <br />If a restaurant is primarily visited by local residents rather than tourist it means that the food offered there has been reviewed positively on social media and shared through word-of-mouth recommendations. It also means that they have established themselves as an authentic local establishment in the area where people would visit for their favorite dishes. This kind of restaurant provides more memorable experiences to visitors since they are able to taste real local cuisine that cannot be found elsewhere. On the other hand, restaurants aiming at tourism may offer overpriced meals with exotic ingredients from far away places which don't really appeal to most people living locally but appealed to many travelers. A restaurant being mostly frequented by locals indicates a higher likelihood of providing quality local fare, unique flavors, and authentic atmosphere, making them ideal destinations for those looking to experience true culinary culture."
1401
+ },
1402
+ "metadata": {},
1403
+ "execution_count": 8
1404
+ }
1405
+ ]
1406
+ },
1407
+ {
1408
+ "cell_type": "code",
1409
+ "source": [
1410
+ "prompt = \"\"\"### Instruction: What are some subtle clues that suggest someone is pretending to understand a topic or conversation when they are actually confused or uninformed?\n",
1411
+ "\n",
1412
+ "### Response:\"\"\"\n",
1413
+ "\n",
1414
+ "output = get_output_batch(model, tokenizer, prompt, genConfig)\n",
1415
+ "md(output.replace(\"\\n\", \"<br />\"))"
1416
+ ],
1417
+ "metadata": {
1418
+ "colab": {
1419
+ "base_uri": "https://localhost:8080/",
1420
+ "height": 220
1421
+ },
1422
+ "id": "fiZoS83qyWP1",
1423
+ "outputId": "b31d5515-f867-45ba-caf5-f304ab2e25db"
1424
+ },
1425
+ "execution_count": 9,
1426
+ "outputs": [
1427
+ {
1428
+ "output_type": "execute_result",
1429
+ "data": {
1430
+ "text/plain": [
1431
+ "<IPython.core.display.Markdown object>"
1432
+ ],
1433
+ "text/markdown": " Here are five possible subtleties indicating that a person may be feigning comprehension on the subject matter, without really understanding it. <br />1) Avoidance of direct questions about details and specifics - This can signal that the individual does not have much information or knowledge to share but wants to appear informed in order to avoid being exposed as having limited expertise.<br />2) Speaking confidently despite gaps in their knowledge - Someone who knows little about something could try to compensate by appearing authoritative through confidence alone, perhaps using technical language or jargon in an attempt to sound like an expert even though they do not fully grasp what is being discussed. <br />3) Failure to recognize when others clarify unclear statements with further explanation – If another party clarifies ambiguous points for them repeatedly, yet the other fails to show any sign of acknowledgement or appreciation for such efforts, then this might indicate an unwillingness to engage meaningfully with contentious issues. <br />4) Attempting to divert attention away from confusing subjects - People sometimes try to change topics if things become complicated, potentially leading the listener astray while trying to protect themselves. They may mention irrelevant or tangential issues, thereby distracting"
1434
+ },
1435
+ "metadata": {},
1436
+ "execution_count": 9
1437
+ }
1438
+ ]
1439
+ },
1440
+ {
1441
+ "cell_type": "markdown",
1442
+ "source": [],
1443
+ "metadata": {
1444
+ "id": "rdIMVU3yyc-p"
1445
+ }
1446
+ },
1447
+ {
1448
+ "cell_type": "code",
1449
+ "source": [
1450
+ "prompt = \"\"\"### Instruction: What are some potential implications of using a single-use plastic bottle versus a reusable bottle on both the environment and human health?\n",
1451
+ "\n",
1452
+ "### Response:\"\"\"\n",
1453
+ "\n",
1454
+ "output = get_output_batch(model, tokenizer, prompt, genConfig)\n",
1455
+ "md(output.replace(\"\\n\", \"<br />\"))"
1456
+ ],
1457
+ "metadata": {
1458
+ "colab": {
1459
+ "base_uri": "https://localhost:8080/",
1460
+ "height": 237
1461
+ },
1462
+ "id": "8PHpk8GWydWo",
1463
+ "outputId": "db8740dc-e76e-417c-d118-1526de1541c3"
1464
+ },
1465
+ "execution_count": 10,
1466
+ "outputs": [
1467
+ {
1468
+ "output_type": "execute_result",
1469
+ "data": {
1470
+ "text/plain": [
1471
+ "<IPython.core.display.Markdown object>"
1472
+ ],
1473
+ "text/markdown": "<br />Single-Use Plastics vs. Reusables <br />The environmental impacts of using a single use plastic bottle as opposed to an eco friendly water bottles can be broken down into four main categories: landfill waste, ocean pollution, energy consumption during production, and potentially harmful chemicals used in their manufacture. By comparison with reusable options like glass or stainless steel bottles which are durable enough to last for years, there is also a financial advantage in terms of cost savings over time that comes from switching away from disposing of thousands of throwaway plastic bottles each year (often made only once before being discarded).<br /><br />Landfill Waste: Single-use plastic bottles have become synonymous with littered roadsides, parks, oceans and other areas where they take centuries to decompose and release harmful greenhouse gases throughout decomposition. Disposal of these items contributes to deforestation because paper bags must often be produced when recycling facilities cannot accept them. While certain types of plastic containers may be compostable after reuse or breakdown naturally, many of those available today do not biodegrade readily. The resultant"
1474
+ },
1475
+ "metadata": {},
1476
+ "execution_count": 10
1477
+ }
1478
+ ]
1479
+ },
1480
+ {
1481
+ "cell_type": "code",
1482
+ "source": [
1483
+ "prompt = \"\"\"### Instruction: What factors would you consider when designing an inclusive and accessible public transportation system?\n",
1484
+ "\n",
1485
+ "### Response:\"\"\"\n",
1486
+ "\n",
1487
+ "output = get_output_batch(model, tokenizer, prompt, genConfig)\n",
1488
+ "md(output.replace(\"\\n\", \"<br />\"))"
1489
+ ],
1490
+ "metadata": {
1491
+ "colab": {
1492
+ "base_uri": "https://localhost:8080/",
1493
+ "height": 237
1494
+ },
1495
+ "id": "qcsoSRAkyj8P",
1496
+ "outputId": "fe33bb34-aa1c-4c43-e31c-2f347ca96bbf"
1497
+ },
1498
+ "execution_count": 11,
1499
+ "outputs": [
1500
+ {
1501
+ "output_type": "execute_result",
1502
+ "data": {
1503
+ "text/plain": [
1504
+ "<IPython.core.display.Markdown object>"
1505
+ ],
1506
+ "text/markdown": "<br />Inclusion is important for all people, especially in terms of their access to public transport. There are several elements that can be considered when creating a more user-friendly transit service: <br /><br />1. Designed For Accessibility - All aspects related to the physical infrastructure should aim at making it easier for people with different abilities or disabilities such as wheelchairs users or vision impaired passengers, among others, to use them. This includes ensuring that the platforms, stations and vehicles have sufficient space and proper equipment (elevators, ramps etc.) to accommodate those who need it. <br />2. Accessible Information – Clear communication channels like Braille signage, tactile maps, audio announcements, videos, information kiosks or even social media pages where commuters can ask questions are essential. They allow everyone to obtain accurate and timely updates about schedule changes, delays, interruptions or other relevant events affecting services without having to rely on a third party to convey this critical information accurately. <br />3. Flexible Schedule & Routes – A flexible schedule allows riders to adapt their trips according to their needs and preferences by providing options to change routes or times during"
1507
+ },
1508
+ "metadata": {},
1509
+ "execution_count": 11
1510
+ }
1511
+ ]
1512
+ },
1513
+ {
1514
+ "cell_type": "code",
1515
+ "source": [],
1516
+ "metadata": {
1517
+ "id": "3kW93wSj2VL8"
1518
+ },
1519
+ "execution_count": 11,
1520
+ "outputs": []
1521
+ }
1522
+ ]
1523
+ }