Update README.md
Browse files
README.md
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
---
|
2 |
activation_function: gelu_new
|
3 |
architectures:
|
4 |
-
- GPT2LMHeadModel
|
5 |
attn_pdrop: 0.1
|
6 |
bos_token_id: 50256
|
7 |
embd_pdrop: 0.1
|
@@ -23,20 +23,26 @@ summary_proj_to_labels: true
|
|
23 |
summary_type: cls_index
|
24 |
summary_use_proj: true
|
25 |
task_specific_params:
|
26 |
-
|
27 |
-
|
28 |
-
|
29 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
30 |
language:
|
31 |
-
- en
|
32 |
tags:
|
33 |
-
-
|
34 |
metrics:
|
35 |
-
-
|
36 |
-
|
37 |
-
datasets:
|
38 |
-
- blended_skill_talk
|
39 |
-
license: apache-2.0
|
40 |
custom_params:
|
41 |
adaptation_rate: 0.05
|
42 |
complexity_metric: null
|
@@ -73,7 +79,6 @@ max_top_n_tokens: 5
|
|
73 |
waiting_served_ratio: 1.2
|
74 |
max_batch_prefill_tokens: 2048
|
75 |
max_waiting_tokens: 200
|
76 |
-
pipeline_tag: text-generation
|
77 |
---
|
78 |
---
|
79 |
## Phillnet Large 🚀
|
|
|
1 |
---
|
2 |
activation_function: gelu_new
|
3 |
architectures:
|
4 |
+
- GPT2LMHeadModel
|
5 |
attn_pdrop: 0.1
|
6 |
bos_token_id: 50256
|
7 |
embd_pdrop: 0.1
|
|
|
23 |
summary_type: cls_index
|
24 |
summary_use_proj: true
|
25 |
task_specific_params:
|
26 |
+
conversational:
|
27 |
+
max_length: 1024
|
28 |
+
min_length: 20
|
29 |
+
length_penalty: 1.5
|
30 |
+
num_beams: 5
|
31 |
+
early_stopping: true
|
32 |
+
no_repeat_ngram_size: 3
|
33 |
+
temperature: 0.7
|
34 |
+
top_k: 50
|
35 |
+
top_p: 0.9
|
36 |
+
license: apache-2.0
|
37 |
+
datasets:
|
38 |
+
- vicgalle/alpaca-gpt4
|
39 |
language:
|
40 |
+
- en
|
41 |
tags:
|
42 |
+
- conversational
|
43 |
metrics:
|
44 |
+
- perplexity
|
45 |
+
- accuracy
|
|
|
|
|
|
|
46 |
custom_params:
|
47 |
adaptation_rate: 0.05
|
48 |
complexity_metric: null
|
|
|
79 |
waiting_served_ratio: 1.2
|
80 |
max_batch_prefill_tokens: 2048
|
81 |
max_waiting_tokens: 200
|
|
|
82 |
---
|
83 |
---
|
84 |
## Phillnet Large 🚀
|