From aafaaf937f3b78406f13f44c471c33812db32ba3 Mon Sep 17 00:00:00 2001 From: xusenlin Date: Fri, 11 Aug 2023 11:41:40 +0800 Subject: [PATCH] Fix typo --- api/patches.py | 2 +- docs/SCRIPT.md | 18 ------------------ 2 files changed, 1 insertion(+), 19 deletions(-) diff --git a/api/patches.py b/api/patches.py index 574639a..f0f56d7 100644 --- a/api/patches.py +++ b/api/patches.py @@ -165,4 +165,4 @@ def apply_rerope_patch(training_length: int = 4096, window_size: int = 512): global TRAINING_LENGTH, WINDOW_SIZE TRAINING_LENGTH, WINDOW_SIZE = training_length, window_size LlamaAttention.forward = forward_with_rerope - logger.info(f"Apply NTK scaling with TRAINING_LENGTH={TRAINING_LENGTH}") + logger.info(f"Apply ReRoPE with TRAINING_LENGTH={TRAINING_LENGTH}") diff --git a/docs/SCRIPT.md b/docs/SCRIPT.md index dba6184..a428df1 100644 --- a/docs/SCRIPT.md +++ b/docs/SCRIPT.md @@ -325,24 +325,6 @@ docker run -it -d --gpus all --ipc=host --net=host -p 80:80 --name=aquila-chat-7 --embedding_name moka-ai/m3e-base ``` -### NewHope - -SLAM-group/NewHope: - -```shell -docker run -it -d --gpus all --ipc=host --net=host -p 80:80 --name=newhope \ - --ulimit memlock=-1 --ulimit stack=67108864 \ - -v `pwd`:/workspace \ - llm-api:pytorch \ - python api/app.py \ - --port 80 \ - --allow-credentials \ - --model_name newhope \ - --model_path SLAM-group/NewHope \ - --device cuda \ - --embedding_name moka-ai/m3e-base -``` - ### Qwen-7b-chat 除已有的环境之外,推荐安装下面的依赖以提高运行效率和降低显存占用