Update README.md

by m8than - opened Sep 3, 2024

base: refs/heads/main

←

from: refs/pr/1

Discussion Files changed

+11

-13

Files changed (4)

.gitattributes +1 -0
README.md +8 -11
imgs/finch.jpg +0 -0
pytorch_model.bin +2 -2

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+pytorch_model.bin filter=lfs diff=lfs merge=lfs -text

README.md CHANGED Viewed

@@ -1,6 +1,3 @@
----
-license: apache-2.0
----
 ### Huggingface RWKV Finch 14B Model
 > HF compatible model for Finch-14B.
@@ -26,7 +23,7 @@ tokenizer = AutoTokenizer.from_pretrained("RWKV/v6-Finch-14B-HF", trust_remote_c
 The following demonstrates the improvements from Eagle 7B to Finch 14B
-|  | [Eagle 7B](https://huggingface.co/RWKV/v6-Finch-14B-HF) | [Finch 7B](https://huggingface.co/RWKV/v6-Finch-7B-HF) | [Finch 14B](https://huggingface.co/RWKV/v6-Finch-14B-HF) |
 | --- | --- | --- | --- |
 | [ARC](https://github.com/EleutherAI/lm-evaluation-harness/tree/main/lm_eval/tasks/arc) | 39.59% | 41.47% | 46.33% |
 | [HellaSwag](https://github.com/EleutherAI/lm-evaluation-harness/tree/main/lm_eval/tasks/hellaswag) | 53.09% | 55.96% | 57.69% |
@@ -59,8 +56,8 @@ User: {instruction}
 Assistant:"""
-model = AutoModelForCausalLM.from_pretrained("RWKV/v6-Finch-14B-HF", trust_remote_code=True).to(torch.float32)
-tokenizer = AutoTokenizer.from_pretrained("RWKV/v6-Finch-14B-HF", trust_remote_code=True)
 text = "请介绍北京的旅游景点"
 prompt = generate_prompt(text)
@@ -115,8 +112,8 @@ User: {instruction}
 Assistant:"""
-model = AutoModelForCausalLM.from_pretrained("RWKV/v6-Finch-14B-HF", trust_remote_code=True, torch_dtype=torch.float16).to(0)
-tokenizer = AutoTokenizer.from_pretrained("RWKV/v6-Finch-14B-HF", trust_remote_code=True)
 text = "介绍一下大熊猫"
 prompt = generate_prompt(text)
@@ -162,8 +159,8 @@ User: {instruction}
 Assistant:"""
-model = AutoModelForCausalLM.from_pretrained("RWKV/v6-Finch-14B-HF", trust_remote_code=True).to(torch.float32)
-tokenizer = AutoTokenizer.from_pretrained("RWKV/v6-Finch-14B-HF", trust_remote_code=True)
 texts = ["请介绍北京的旅游景点", "介绍一下大熊猫", "乌兰察布"]
 prompts = [generate_prompt(text) for text in texts]
@@ -214,6 +211,6 @@ Assistant: 乌兰察布是中国新疆维吾尔自治区的一个县级市，位
 ## Acknowledgement
 We are grateful for the help and support from the following key groups:
-- [Recursal.ai](https://recursal.ai) team for financing the GPU resources, and managing the training of this foundation model - you can run the Finch line of RWKV models on their cloud / on-premise platform today.
 - EleutherAI for their support, especially in the v5/v6 Eagle/Finch paper
 - Linux Foundation AI & Data group for supporting and hosting the RWKV project

 ### Huggingface RWKV Finch 14B Model
 > HF compatible model for Finch-14B.
 The following demonstrates the improvements from Eagle 7B to Finch 14B
+|  | [Eagle 7B](https://huggingface.co/RWKV/v5-Eagle-7B-HF) | [Finch 7B](https://huggingface.co/RWKV/v6-Finch-7B-HF) | [Finch 14B](https://huggingface.co/RWKV/v6-Finch-14B-HF) |
 | --- | --- | --- | --- |
 | [ARC](https://github.com/EleutherAI/lm-evaluation-harness/tree/main/lm_eval/tasks/arc) | 39.59% | 41.47% | 46.33% |
 | [HellaSwag](https://github.com/EleutherAI/lm-evaluation-harness/tree/main/lm_eval/tasks/hellaswag) | 53.09% | 55.96% | 57.69% |
 Assistant:"""
+model = AutoModelForCausalLM.from_pretrained("RWKV/v5-Eagle-7B-HF", trust_remote_code=True).to(torch.float32)
+tokenizer = AutoTokenizer.from_pretrained("RWKV/v5-Eagle-7B-HF", trust_remote_code=True)
 text = "请介绍北京的旅游景点"
 prompt = generate_prompt(text)
 Assistant:"""
+model = AutoModelForCausalLM.from_pretrained("RWKV/v5-Eagle-7B-HF", trust_remote_code=True, torch_dtype=torch.float16).to(0)
+tokenizer = AutoTokenizer.from_pretrained("RWKV/v5-Eagle-7B-HF", trust_remote_code=True)
 text = "介绍一下大熊猫"
 prompt = generate_prompt(text)
 Assistant:"""
+model = AutoModelForCausalLM.from_pretrained("RWKV/v5-Eagle-7B-HF", trust_remote_code=True).to(torch.float32)
+tokenizer = AutoTokenizer.from_pretrained("RWKV/v5-Eagle-7B-HF", trust_remote_code=True)
 texts = ["请介绍北京的旅游景点", "介绍一下大熊猫", "乌兰察布"]
 prompts = [generate_prompt(text) for text in texts]
 ## Acknowledgement
 We are grateful for the help and support from the following key groups:
+- [Recursal.ai](https://recursal.ai) team for financing the GPU resources, and managing the training of this foundation model - you can run the Eagle line of RWKV models on their cloud / on-premise platform today.
 - EleutherAI for their support, especially in the v5/v6 Eagle/Finch paper
 - Linux Foundation AI & Data group for supporting and hosting the RWKV project

imgs/finch.jpg DELETED Viewed

Binary file (315 kB)

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f5f3477146b7dc0e68a1e64faac1e3b87a257d10f69a0078908d8d9bce6aaae9
-size 28138382794

 version https://git-lfs.github.com/spec/v1
+oid sha256:d8fd6a260cf910c13729c34109b47c4f28ec009764c79a25f8b35cf853997415
+size 28138382858