Update README.md
Browse files
README.md
CHANGED
@@ -56,25 +56,13 @@ Here we list our data distribution in each stage:
|
|
56 |
|
57 |
| Corpus | Basic pretraining | Continual pretraining with specific domain | Cooldown |
|
58 |
| ------------- | ----------------- | ------------------------------------------ | -------- |
|
59 |
-
|
|
60 |
-
| C4 | 35.0 | 35.0 | 35.0 |
|
61 |
-
| CommonCrawl | 70.1 | 70.1 | 70.1 |
|
62 |
-
| Github | 6.5 | 6.5 | 6.5 |
|
63 |
-
| StackExchange | 4.2 | 4.2 | 4.2 |
|
64 |
-
| ArXiv | 5.7 | 5.7 | 5.7 |
|
65 |
-
| Wikipedia | 4.5 | 4.5 | 4.5 |
|
66 |
|
67 |
### TinyLlama_v1.1_math_code
|
68 |
|
69 |
| Corpus | Basic pretraining | Continual pretraining with specific domain | Cooldown |
|
70 |
| ------------- | ----------------- | ------------------------------------------ | -------- |
|
71 |
-
|
|
72 |
-
| C4 | 35.0 | 21.6 | 21.6 |
|
73 |
-
| CommonCrawl | 70.1 | 43.0 | 43.0 |
|
74 |
-
| Github | 6.5 | - | - |
|
75 |
-
| StackExchange | 4.2 | 2.6 | 2.6 |
|
76 |
-
| ArXiv | 5.7 | 5.0 | 5.0 |
|
77 |
-
| Wikipedia | 4.5 | 2.8 | 2.8 |
|
78 |
| starcoder | - | 15.0 | 15.0 |
|
79 |
| proof_pile | - | 10.0 | 10.0 |
|
80 |
|
@@ -82,13 +70,7 @@ Here we list our data distribution in each stage:
|
|
82 |
|
83 |
| orpus | Basic pretraining | Continual pretraining with specific domain | Cooldown |
|
84 |
| ------------- | ----------------- | ------------------------------------------ | -------- |
|
85 |
-
|
|
86 |
-
| C4 | 35.0 | 14.6 | 14.6 |
|
87 |
-
| CommonCrawl | 70.1 | 29.3 | 29.3 |
|
88 |
-
| Github | 6.5 | - | - |
|
89 |
-
| StackExchange | 4.2 | 1.8 | 1.8 |
|
90 |
-
| ArXiv | 5.7 | 2.4 | 2.4 |
|
91 |
-
| Wikipedia | 4.5 | 1.9 | 1.9 |
|
92 |
| skypile | - | 50.0 | 50.0 |
|
93 |
|
94 |
### How to use
|
|
|
56 |
|
57 |
| Corpus | Basic pretraining | Continual pretraining with specific domain | Cooldown |
|
58 |
| ------------- | ----------------- | ------------------------------------------ | -------- |
|
59 |
+
| Slimpajama | 100.0 | 100.0 | 100.0 |
|
|
|
|
|
|
|
|
|
|
|
|
|
60 |
|
61 |
### TinyLlama_v1.1_math_code
|
62 |
|
63 |
| Corpus | Basic pretraining | Continual pretraining with specific domain | Cooldown |
|
64 |
| ------------- | ----------------- | ------------------------------------------ | -------- |
|
65 |
+
| Slimpajama | 100.0 | 75.0 | 75.0 |
|
|
|
|
|
|
|
|
|
|
|
|
|
66 |
| starcoder | - | 15.0 | 15.0 |
|
67 |
| proof_pile | - | 10.0 | 10.0 |
|
68 |
|
|
|
70 |
|
71 |
| orpus | Basic pretraining | Continual pretraining with specific domain | Cooldown |
|
72 |
| ------------- | ----------------- | ------------------------------------------ | -------- |
|
73 |
+
| Slimpajama | 100.0 | 50.0 | 50.0 |
|
|
|
|
|
|
|
|
|
|
|
|
|
74 |
| skypile | - | 50.0 | 50.0 |
|
75 |
|
76 |
### How to use
|