update model

This commit is contained in:
gongjy 2024-09-16 15:29:57 +08:00
parent e1f68b5e37
commit e4ad822c40
4 changed files with 16 additions and 20 deletions

View File

@@ -152,7 +152,7 @@ streamlit run fast_inference.py
* 0、环境安装 * 0、环境安装
```bash ```bash
pip install -r requirements.txt pip install -r requirements.txt -i https://pypi.tuna.tsinghua.edu.cn/simple
``` ```
* 1、克隆项目代码 * 1、克隆项目代码
```text ```text
@@ -702,10 +702,11 @@ minimind模型本身没有使用较大的数据集训练也没有针对回答
## 🤝[贡献者](https://github.com/jingyaogong/minimind/graphs/contributors) ## 🤝[贡献者](https://github.com/jingyaogong/minimind/graphs/contributors)
[//]: # (<br/>) <!--
[//]: # (<a href="https://github.com/jingyaogong/minimind/graphs/contributors">) <a href="https://github.com/jingyaogong/minimind/graphs/contributors">
[//]: # ( <img src="https://contrib.rocks/image?repo=jingyaogong/minimind&v=3" />) <img src="https://contrib.rocks/image?repo=jingyaogong/minimind&v3" />
[//]: # (</a>) </a>
-->
<a href="https://github.com/jingyaogong"><img src="https://avatars.githubusercontent.com/u/62287848" width="70px" height="70px"/></a>&nbsp; <a href="https://github.com/jingyaogong"><img src="https://avatars.githubusercontent.com/u/62287848" width="70px" height="70px"/></a>&nbsp;
<a href="https://github.com/MuWinds"><img src="https://avatars.githubusercontent.com/u/93832089" width="70px" height="70px"/></a>&nbsp; <a href="https://github.com/MuWinds"><img src="https://avatars.githubusercontent.com/u/93832089" width="70px" height="70px"/></a>&nbsp;

View File

@@ -779,20 +779,16 @@ your model with third-party UIs, such as fastgpt, OpenWebUI, etc.
## 🤝[Contributors](https://github.com/jingyaogong/minimind/graphs/contributors) ## 🤝[Contributors](https://github.com/jingyaogong/minimind/graphs/contributors)
[//]: # (<br/>) <!--
<a href="https://github.com/jingyaogong/minimind/graphs/contributors">
<img src="https://contrib.rocks/image?repo=jingyaogong/minimind&v3" />
</a>
-->
[//]: # (<a href="https://github.com/jingyaogong/minimind/graphs/contributors">) <a href="https://github.com/jingyaogong"><img src="https://avatars.githubusercontent.com/u/62287848" width="70px" height="70px"/></a>&nbsp;
<a href="https://github.com/MuWinds"><img src="https://avatars.githubusercontent.com/u/93832089" width="70px" height="70px"/></a>&nbsp;
<a href="https://github.com/chuanzhubin"><img src="https://avatars.githubusercontent.com/u/2813798" width="70px" height="70px"/></a>&nbsp;
[//]: # ( <img src="https://contrib.rocks/image?repo=jingyaogong/minimind&v=3" />)
[//]: # (</a>)
<a href="https://github.com/jingyaogong"><img src="https://avatars.githubusercontent.com/u/62287848" width="70px" height="70px"/></a>
&nbsp;
<a href="https://github.com/MuWinds"><img src="https://avatars.githubusercontent.com/u/93832089" width="70px" height="70px"/></a>
&nbsp;
<a href="https://github.com/chuanzhubin"><img src="https://avatars.githubusercontent.com/u/2813798" width="70px" height="70px"/></a>
&nbsp;
## 😊Thanks for ## 😊Thanks for

View File

@@ -17,7 +17,7 @@ class LMConfig(PretrainedConfig):
norm_eps: float = 1e-5, norm_eps: float = 1e-5,
max_seq_len: int = 512, max_seq_len: int = 512,
dropout: float = 0.0, dropout: float = 0.0,
flash_attn: bool = False, flash_attn: bool = True,
#################################################### ####################################################
# Here are the specific configurations of MOE # Here are the specific configurations of MOE
# When use_moe is false, the following settings are ignored # When use_moe is false, the following settings are ignored

View File

@@ -1,6 +1,5 @@
datasets==2.16.1 datasets==2.16.1
datasketch==1.6.4 datasketch==1.6.4
flash_attn==2.5.0
Flask==3.0.3 Flask==3.0.3
Flask_Cors==4.0.0 Flask_Cors==4.0.0
jieba==0.42.1 jieba==0.42.1
@@ -20,7 +19,7 @@ scikit_learn==1.5.1
sentence_transformers==2.3.1 sentence_transformers==2.3.1
simhash==2.1.2 simhash==2.1.2
tiktoken==0.5.1 tiktoken==0.5.1
torch==2.1.2+cu121 torch==2.1.2
transformers==4.44.0 transformers==4.44.0
jinja2==3.1.2 jinja2==3.1.2
jsonlines==4.0.0 jsonlines==4.0.0