diff --git a/README.md b/README.md
index 93bb9a3..260c195 100644
--- a/README.md
+++ b/README.md
@@ -106,7 +106,7 @@ https://github.com/user-attachments/assets/88b98128-636e-43bc-a419-b1b1403c2055
* CUDA == 12.2
* [requirements.txt](./requirements.txt)
-# 📌 Deployment & Inference
+# 📌 Quick Inference & Test

@@ -174,15 +174,13 @@ streamlit run fast_inference.py
│  ├── full_sft_512.pth
│  ├── full_sft_640_moe.pth
- │  └── full_sft_640.pth
+ │  ├── full_sft_640.pth
+ │  └── full_sft_768.pth
├── single_chat
│  ├── full_sft_1024.pth
│  ├── full_sft_512.pth
│  ├── full_sft_640_moe.pth
- │  └── full_sft_640.pth
+ │  ├── full_sft_640.pth
- ├── full_sft_1024.pth
- ├── full_sft_512.pth
- ├── full_sft_640_moe.pth
- ├── full_sft_640.pth
+ │  └── full_sft_768.pth
├── pretrain_1024.pth
├── pretrain_640_moe.pth
├── pretrain_640.pth
diff --git a/README_en.md b/README_en.md
index 0598c58..465fd12 100644
--- a/README_en.md
+++ b/README_en.md
@@ -114,7 +114,7 @@ These are my personal software and hardware environment configurations. Please a
* CUDA == 12.2
* [requirements.txt](./requirements.txt)
-# 📌 Deployment & Inference
+# 📌 Quick Inference & Test

@@ -192,15 +192,13 @@ git clone https://github.com/jingyaogong/minimind.git
│  ├── full_sft_512.pth
│  ├── full_sft_640_moe.pth
- │  └── full_sft_640.pth
+ │  ├── full_sft_640.pth
+ │  └── full_sft_768.pth
├── single_chat
│  ├── full_sft_1024.pth
│  ├── full_sft_512.pth
│  ├── full_sft_640_moe.pth
- │  └── full_sft_640.pth
+ │  ├── full_sft_640.pth
- ├── full_sft_1024.pth
- ├── full_sft_512.pth
- ├── full_sft_640_moe.pth
- ├── full_sft_640.pth
+ │  └── full_sft_768.pth
├── pretrain_1024.pth
├── pretrain_640_moe.pth
├── pretrain_640.pth