From 23a167f4145cf003bdf13a9a2f4c18a8ee3db6b7 Mon Sep 17 00:00:00 2001 From: xxl <505279206@qq.com> Date: Mon, 13 Jan 2025 11:55:54 +0800 Subject: [PATCH] first commit --- README.md | 97 ++++++++++++++++++- ...-x070-World-0.1B-v2.8-20241210-ctx4096.pth | 3 + ...-x070-World-0.4B-v2.9-20250107-ctx4096.pth | 3 + configuration.json | 1 + 4 files changed, 102 insertions(+), 2 deletions(-) create mode 100644 RWKV-x070-World-0.1B-v2.8-20241210-ctx4096.pth create mode 100644 RWKV-x070-World-0.4B-v2.9-20250107-ctx4096.pth create mode 100644 configuration.json diff --git a/README.md b/README.md index ae71928..83d6da9 100644 --- a/README.md +++ b/README.md @@ -1,3 +1,96 @@ -# rwkv-7-world +--- +language: +- en +- zh +- fr +- es +- de +- pt +- ru +- it +- ja +- ko +- vi +- ar +tags: +- pytorch +- text-generation +- causal-lm +- rwkv +license: apache-2.0 +datasets: +- HuggingFaceFW/fineweb-edu +- mlfoundations/dclm-baseline-1.0 +- cerebras/SlimPajama-627B +- EleutherAI/pile +- bigcode/starcoderdata +- oscar-corpus/OSCAR-2301 +--- -rwkv-7-world \ No newline at end of file +# RWKV-7 World + +Use rwkv pip package 0.8.28+ for RWKV-7 inference: https://pypi.org/project/rwkv/ + +Evals and more information: https://www.rwkv.com/ + +For developers: https://github.com/BlinkDL/RWKV-LM/tree/main/RWKV-v7 + +Chat demo: https://github.com/BlinkDL/ChatRWKV/blob/main/API_DEMO_CHAT.py + +## Model Description + +RWKV-7 trained on 100+ world languages (80% English, 10% multilang, 10% code). 
+ +World-v3 = 3.1T tokens + +World-v2.9 = subsampled 2T tokens + +World-v2.8 = subsampled 1T tokens + +Recommended fine-tuning format (use \n for newlines): +``` +User: xxxxxxxxxxxxxxx + +Assistant: xxxxxxxxxxxxxxx +xxxxxxxxxxxxxxx +xxxxxxxxxxxxxxx + +User: xxxxxxxxxxxxxxx +xxxxxxxxxxxxxxx + +Assistant: xxxxxxxxxxxxxxx +xxxxxxxxxxxxxxx +xxxxxxxxxxxxxxx +xxxxxxxxxxxxxxx +``` + +A good chat prompt (it is better to replace \n\n in xxx with \n, so that there will never be an extra \n\n in the response): +``` +User: hi + +Assistant: Hi. I am your assistant and I will provide expert full response in full details. Please feel free to ask any question and I will always answer it. + +User: xxx + +Assistant: +``` +QA prompt (it is better to replace \n\n in xxx with \n, so that there will never be an extra \n\n in the response): +``` +Question: xxx + +Answer: +``` +and +``` +Instruction: xxx + +Input: xxx + +Response: +``` + +!!! There should not be any space after your final ":" or you will upset the tokenizer and see non-English response !!! + +!!! There should not be any space after your final ":" or you will upset the tokenizer and see non-English response !!! + +!!! There should not be any space after your final ":" or you will upset the tokenizer and see non-English response !!! 
\ No newline at end of file diff --git a/RWKV-x070-World-0.1B-v2.8-20241210-ctx4096.pth b/RWKV-x070-World-0.1B-v2.8-20241210-ctx4096.pth new file mode 100644 index 0000000..bfafd0e --- /dev/null +++ b/RWKV-x070-World-0.1B-v2.8-20241210-ctx4096.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60c98129b9529963bff2c164b8ab4bd17c19332ae06dc2dcae32aa3a3739295a +size 382195690 diff --git a/RWKV-x070-World-0.4B-v2.9-20250107-ctx4096.pth b/RWKV-x070-World-0.4B-v2.9-20250107-ctx4096.pth new file mode 100644 index 0000000..357daf3 --- /dev/null +++ b/RWKV-x070-World-0.4B-v2.9-20250107-ctx4096.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08cf602b33e59a5717b8f0cafaf7f04c50c1c67166e477aa2f47c5ca180da4a +size 901794466 diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..f9291c3 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework":"Pytorch","task":"text-generation"} \ No newline at end of file