{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "ebcf3daa-78ce-4baa-846a-ea5e298c9de5", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\u001b[33mWARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv\u001b[0m\u001b[33m\n", "\u001b[0mNote: you may need to restart the kernel to use updated packages.\n" ] } ], "source": [ "pip install -q datasets trl peft bitsandbytes sentencepiece wandb huggingface_hub" ] }, { "cell_type": "code", "execution_count": 1, "id": "4d54dddd-dfda-481a-95d4-79d1525524c4", "metadata": {}, "outputs": [ { "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "a9bddf0a36c64d3f9c6d4a58c3d59282", "version_major": 2, "version_minor": 0 }, "text/plain": [ "VBox(children=(HTML(value='
/workspace/wandb/run-20240128_065712-os8qoadz
"
],
"text/plain": [
"Step | \n", "Training Loss | \n", "
---|---|
1 | \n", "0.703000 | \n", "
2 | \n", "0.698300 | \n", "
3 | \n", "0.703000 | \n", "
4 | \n", "0.675100 | \n", "
5 | \n", "0.694200 | \n", "
6 | \n", "0.675100 | \n", "
7 | \n", "0.675300 | \n", "
8 | \n", "0.658600 | \n", "
9 | \n", "0.641100 | \n", "
10 | \n", "0.634400 | \n", "
11 | \n", "0.609300 | \n", "
12 | \n", "0.606500 | \n", "
13 | \n", "0.607200 | \n", "
14 | \n", "0.560900 | \n", "
15 | \n", "0.563000 | \n", "
16 | \n", "0.527200 | \n", "
17 | \n", "0.473300 | \n", "
18 | \n", "0.486900 | \n", "
19 | \n", "0.454200 | \n", "
20 | \n", "0.426300 | \n", "
21 | \n", "0.381000 | \n", "
22 | \n", "0.361900 | \n", "
23 | \n", "0.344100 | \n", "
24 | \n", "0.298400 | \n", "
25 | \n", "0.298100 | \n", "
26 | \n", "0.256600 | \n", "
27 | \n", "0.245600 | \n", "
28 | \n", "0.214800 | \n", "
29 | \n", "0.190200 | \n", "
30 | \n", "0.163100 | \n", "
31 | \n", "0.148100 | \n", "
32 | \n", "0.136700 | \n", "
33 | \n", "0.117100 | \n", "
34 | \n", "0.097800 | \n", "
35 | \n", "0.105300 | \n", "
36 | \n", "0.072300 | \n", "
37 | \n", "0.077200 | \n", "
38 | \n", "0.056100 | \n", "
39 | \n", "0.051000 | \n", "
40 | \n", "0.041900 | \n", "
41 | \n", "0.035800 | \n", "
42 | \n", "0.031700 | \n", "
43 | \n", "0.013200 | \n", "
44 | \n", "0.014600 | \n", "
45 | \n", "0.036300 | \n", "
46 | \n", "0.012200 | \n", "
47 | \n", "0.012500 | \n", "
48 | \n", "0.011200 | \n", "
49 | \n", "0.013500 | \n", "
50 | \n", "0.008400 | \n", "
51 | \n", "0.004900 | \n", "
52 | \n", "0.006900 | \n", "
53 | \n", "0.010800 | \n", "
54 | \n", "0.006800 | \n", "
55 | \n", "0.003900 | \n", "
56 | \n", "0.005600 | \n", "
57 | \n", "0.002100 | \n", "
58 | \n", "0.001800 | \n", "
59 | \n", "0.004600 | \n", "
60 | \n", "0.001600 | \n", "
61 | \n", "0.002000 | \n", "
62 | \n", "0.001400 | \n", "
63 | \n", "0.001000 | \n", "
64 | \n", "0.002900 | \n", "
65 | \n", "0.000800 | \n", "
66 | \n", "0.004300 | \n", "
67 | \n", "0.000700 | \n", "
68 | \n", "0.002700 | \n", "
69 | \n", "0.000500 | \n", "
70 | \n", "0.002600 | \n", "
71 | \n", "0.000600 | \n", "
72 | \n", "0.000400 | \n", "
73 | \n", "0.000800 | \n", "
74 | \n", "0.000700 | \n", "
75 | \n", "0.000400 | \n", "
76 | \n", "0.000600 | \n", "
77 | \n", "0.000900 | \n", "
78 | \n", "0.000300 | \n", "
79 | \n", "0.001000 | \n", "
80 | \n", "0.000300 | \n", "
81 | \n", "0.002800 | \n", "
82 | \n", "0.000900 | \n", "
83 | \n", "0.000300 | \n", "
84 | \n", "0.000200 | \n", "
85 | \n", "0.000300 | \n", "
86 | \n", "0.010300 | \n", "
87 | \n", "0.001800 | \n", "
88 | \n", "0.000400 | \n", "
89 | \n", "0.000300 | \n", "
90 | \n", "0.000200 | \n", "
"
],
"text/plain": [
"