Update README.md
Browse files
README.md
CHANGED
@@ -132,23 +132,40 @@ Use the code below to get started with the model.
|
|
132 |
|
133 |
### Results
|
134 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
135 |
|
136 |
|
137 |
-
| | EN | | | | | ZH | | | JA | | |
|
138 |
-
|--------------------------|-----------|-------|-------|---------|----------|-----------|-------|--------|---------|---------|-------|
|
139 |
-
| Model | MedQA-4op | MedQA | MMLU | MedMCQA | PubMedQA | MedQA-4op | MedQA | CMExam | JJSIMQA | IgakuQA | DenQA |
|
140 |
-
| Gemma -7B | 52.92 | 47.56 | 69.74 | 48.67 | 73.44 | 48.90 | 44.55 | 38.60 | 27.61 | 35.80 | 25.14 |
|
141 |
-
| Llama2 -7B | 36.59 | 28.79 | 44.19 | 36.27 | 32.80 | 29.52 | 24.85 | 23.55 | 12.61 | 17.45 | 17.08 |
|
142 |
-
| Llama3 -8B | 58.52 | 52.76 | 70.02 | 55.25 | 75.05 | 51.42 | 44.64 | 39.41 | 28.91 | 33.20 | 23.47 |
|
143 |
-
| Swallow -8B -v0.1 | 47.87 | 45.66 | 65.87 | 49.99 | 64.39 | 47.35 | 40.84 | 35.94 | 37.83 | 45.15 | 29.03 |
|
144 |
-
| med alpaca -7B | 37.62 | 30.99 | 51.75 | 34.23 | 39.84 | 30.81 | 25.17 | 23.40 | 14.35 | 16.55 | 10.83 |
|
145 |
-
| Meditron -7B | 35.09 | 29.10 | 46.96 | 29.88 | 20.52 | 31.10 | 24.47 | 22.61 | 13.48 | 18.15 | 15.56 |
|
146 |
-
| Open BioLLM -8B | 40.14 | 50.08 | 73.15 | 56.23 | 65.39 | 50.37 | 42.59 | 24.59 | 20.87 | 31.50 | 14.44 |
|
147 |
-
| DISC -MedLLM | 37.46 | 32.89 | 50.00 | 36.96 | 33.20 | 47.18 | 46.13 | 41.57 | 23.26 | 27.15 | 23.47 |
|
148 |
-
| Apollo -7B | 54.97 | 49.68 | 68.73 | 53.48 | 75.86 | 65.19 | 60.98 | 51.40 | 25.00 | 37.40 | 24.72 |
|
149 |
-
| ELAINE -medLLM | 56.15 | 50.39 | 67.62 | 53.74 | 71.83 | 57.50 | 52.44 | 44.99 | 35.65 | 45.75 | 29.86 |
|
150 |
-
| ELAINE -medLLM -instruct | 58.36 | 55.84 | 72.79 | 54.48 | 73.24 | 61.59 | 55.71 | 47.19 | 35.22 | 46.35 | 32.36 |
|
151 |
-
|
152 |
|
153 |
#### Summary
|
154 |
|
|
|
132 |
|
133 |
### Results
|
134 |
|
135 |
+
| | EN | | | | |
|
136 |
+
|--------------------------|-----------|-------|-------|---------|----------|
|
137 |
+
| Model | MedQA-4op | MedQA | MMLU | MedMCQA | PubMedQA |
|
138 |
+
| Gemma-7B | 52.92 | 47.56 | 69.74 | 48.67 | 73.44 |
|
139 |
+
| Llama2-7B | 36.59 | 28.79 | 44.19 | 36.27 | 32.80 |
|
140 |
+
| Llama3-8B | 58.52 | 52.76 | 70.02 | 55.25 | 75.05 |
|
141 |
+
| Swallow-8B-v0.1 | 47.87 | 45.66 | 65.87 | 49.99 | 64.39 |
|
142 |
+
| MedAlpaca-7B | 37.62 | 30.99 | 51.75 | 34.23 | 39.84 |
|
143 |
+
| Meditron-7B | 35.09 | 29.10 | 46.96 | 29.88 | 20.52 |
|
144 |
+
| OpenBioLLM-8B | 40.14 | 50.08 | 73.15 | 56.23 | 65.39 |
|
145 |
+
| DISC-MedLLM | 37.46 | 32.89 | 50.00 | 36.96 | 33.20 |
|
146 |
+
| Apollo-7B | 54.97 | 49.68 | 68.73 | 53.48 | 75.86 |
|
147 |
+
| ELAINE-medLLM | 56.15 | 50.39 | 67.62 | 53.74 | 71.83 |
|
148 |
+
| ELAINE-medLLM-instruct | 58.36 | 55.84 | 72.79 | 54.48 | 73.24 |
|
149 |
+
|
150 |
+
|
151 |
+
|
|
152 |
+
|
153 |
+
| | ZH | | | JA | | |
|
154 |
+
|--------------------------|-----------|-------|--------|---------|---------|-------|
|
155 |
+
| Model | MedQA-4op | MedQA | CMExam | JJSIMQA | IgakuQA | DenQA |
|
156 |
+
| Gemma-7B | 48.90 | 44.55 | 38.60 | 27.61 | 35.80 | 25.14 |
|
157 |
+
| Llama2-7B | 29.52 | 24.85 | 23.55 | 12.61 | 17.45 | 17.08 |
|
158 |
+
| Llama3-8B | 51.42 | 44.64 | 39.41 | 28.91 | 33.20 | 23.47 |
|
159 |
+
| Swallow-8B-v0.1 | 47.35 | 40.84 | 35.94 | 37.83 | 45.15 | 29.03 |
|
160 |
+
| MedAlpaca-7B | 30.81 | 25.17 | 23.40 | 14.35 | 16.55 | 10.83 |
|
161 |
+
| Meditron-7B | 31.10 | 24.47 | 22.61 | 13.48 | 18.15 | 15.56 |
|
162 |
+
| OpenBioLLM-8B | 50.37 | 42.59 | 24.59 | 20.87 | 31.50 | 14.44 |
|
163 |
+
| DISC-MedLLM | 47.18 | 46.13 | 41.57 | 23.26 | 27.15 | 23.47 |
|
164 |
+
| Apollo-7B | 65.19 | 60.98 | 51.40 | 25.00 | 37.40 | 24.72 |
|
165 |
+
| ELAINE-medLLM | 57.50 | 52.44 | 44.99 | 35.65 | 45.75 | 29.86 |
|
166 |
+
| ELAINE-medLLM-instruct | 61.59 | 55.71 | 47.19 | 35.22 | 46.35 | 32.36 |
|
167 |
|
168 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
169 |
|
170 |
#### Summary
|
171 |
|