Upload 36 files
Browse files
- .gitattributes +31 -0
- MiniMind2-R1.gguf +3 -0
- MiniMind2-Small-R1.gguf +3 -0
- MiniMind2-Small.gguf +3 -0
- MiniMind2.gguf +3 -0
- Q4-MiniMind2-R1.gguf +3 -0
- Q4-MiniMind2-Small-R1.gguf +3 -0
- Q4-MiniMind2-Small.gguf +3 -0
- Q4-MiniMind2.gguf +3 -0
- README.md +0 -0
- README_en.md +0 -0
- images/1-wiki.png +3 -0
- images/2-wiki.png +0 -0
- images/3-wiki.png +3 -0
- images/4-wiki.png +3 -0
- images/5-wiki.png +3 -0
- images/LLM-structure-moe.png +3 -0
- images/LLM-structure.png +3 -0
- images/and_huggingface.png +3 -0
- images/and_modelscope.png +3 -0
- images/compare_radar.png +3 -0
- images/dataset.jpg +3 -0
- images/gpt3_config.png +0 -0
- images/logo.png +3 -0
- images/logo2.png +3 -0
- images/minimind2.gif +3 -0
- images/pre_512_loss.png +3 -0
- images/pre_768_loss.png +3 -0
- images/rope_ppl.png +3 -0
- images/sft_512_loss.png +3 -0
- images/sft_768_loss.png +3 -0
- images/train_grpo_512.png +3 -0
- images/train_grpo_768.png +3 -0
- images/train_ppo_512.png +3 -0
- images/train_ppo_768.png +3 -0
- images/train_spo_768.png +3 -0
- minimind.modelfile +11 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,34 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
images/1-wiki.png filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
images/3-wiki.png filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
images/4-wiki.png filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
images/5-wiki.png filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
images/and_huggingface.png filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
images/and_modelscope.png filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
images/compare_radar.png filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
images/dataset.jpg filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
images/LLM-structure-moe.png filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
images/LLM-structure.png filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
images/logo.png filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
images/logo2.png filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
images/minimind2.gif filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
images/pre_512_loss.png filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
images/pre_768_loss.png filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
images/rope_ppl.png filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
images/sft_512_loss.png filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
images/sft_768_loss.png filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
images/train_grpo_512.png filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
images/train_grpo_768.png filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
images/train_ppo_512.png filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
images/train_ppo_768.png filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
images/train_spo_768.png filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
MiniMind2-R1.gguf filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
MiniMind2-Small-R1.gguf filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
MiniMind2-Small.gguf filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
MiniMind2.gguf filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
Q4-MiniMind2-R1.gguf filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
Q4-MiniMind2-Small-R1.gguf filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
Q4-MiniMind2-Small.gguf filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
Q4-MiniMind2.gguf filter=lfs diff=lfs merge=lfs -text
|
MiniMind2-R1.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c405b6fa84265faa8de7e486c52fc4ad3c0d69fbd993ded7045dcbaf7a488db5
|
| 3 |
+
size 208349408
|
MiniMind2-Small-R1.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6d9e1b2cf50561e8b2551aae46b4c039996701d15c9436051c1311cfddcdefb5
|
| 3 |
+
size 51909760
|
MiniMind2-Small.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:513693600fe4463417f00b019c1d20b5fbf6edca0983ce6145bd1680bd346b21
|
| 3 |
+
size 51909696
|
MiniMind2.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5fbab733ea560088522636975993dce17c49b944a52b67afddd94d6a758982b
|
| 3 |
+
size 208349408
|
Q4-MiniMind2-R1.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97fbcc049fba5d533a85843cc4210560a745dcf6628083636d0a897d96c122ea
|
| 3 |
+
size 63656672
|
Q4-MiniMind2-Small-R1.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7b5ad59340d993533dd19bf1dc4f53a62ff06dfc6d28b1c4f3fab1d3b37052e
|
| 3 |
+
size 17506432
|
Q4-MiniMind2-Small.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:175aee237f69f00f9f70c56985cd7356d5e81e60df8151e9ae7d542414a02746
|
| 3 |
+
size 17506368
|
Q4-MiniMind2.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0e4592d6015327dbf1a71b8572284becd59e03344a3a4bc1365932ad7efa22e
|
| 3 |
+
size 63656672
|
README.md
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
README_en.md
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
images/1-wiki.png
ADDED
|
Git LFS Details
|
images/2-wiki.png
ADDED
|
images/3-wiki.png
ADDED
|
Git LFS Details
|
images/4-wiki.png
ADDED
|
Git LFS Details
|
images/5-wiki.png
ADDED
|
Git LFS Details
|
images/LLM-structure-moe.png
ADDED
|
Git LFS Details
|
images/LLM-structure.png
ADDED
|
Git LFS Details
|
images/and_huggingface.png
ADDED
|
Git LFS Details
|
images/and_modelscope.png
ADDED
|
Git LFS Details
|
images/compare_radar.png
ADDED
|
Git LFS Details
|
images/dataset.jpg
ADDED
|
Git LFS Details
|
images/gpt3_config.png
ADDED
|
images/logo.png
ADDED
|
Git LFS Details
|
images/logo2.png
ADDED
|
Git LFS Details
|
images/minimind2.gif
ADDED
|
Git LFS Details
|
images/pre_512_loss.png
ADDED
|
Git LFS Details
|
images/pre_768_loss.png
ADDED
|
Git LFS Details
|
images/rope_ppl.png
ADDED
|
Git LFS Details
|
images/sft_512_loss.png
ADDED
|
Git LFS Details
|
images/sft_768_loss.png
ADDED
|
Git LFS Details
|
images/train_grpo_512.png
ADDED
|
Git LFS Details
|
images/train_grpo_768.png
ADDED
|
Git LFS Details
|
images/train_ppo_512.png
ADDED
|
Git LFS Details
|
images/train_ppo_768.png
ADDED
|
Git LFS Details
|
images/train_spo_768.png
ADDED
|
Git LFS Details
|
minimind.modelfile
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
FROM ./Q4-MiniMind2.gguf
|
| 2 |
+
|
| 3 |
+
SYSTEM """You are a helpful assistant"""
|
| 4 |
+
|
| 5 |
+
TEMPLATE """<|im_start|>system
|
| 6 |
+
{{ .System }}<|im_end|>
|
| 7 |
+
<|im_start|>user
|
| 8 |
+
{{ .Prompt }}<|im_end|>
|
| 9 |
+
<|im_start|>assistant
|
| 10 |
+
{{ .Response }}<|im_end|>
|
| 11 |
+
"""
|