From 5c7bd51840baeec3e7ce1d9eb6542a3841912c56 Mon Sep 17 00:00:00 2001
From: dengsgo
Date: Sun, 2 Jul 2023 16:58:05 +0800
Subject: [PATCH 1/4] add dockerfile Support

---
Review notes (placed after the separator, so not part of the commit message):
- Line structure was restored from a whitespace-collapsed copy of this
  series. Blank context lines were placed so that each hunk matches its
  declared line counts; the 4-space indent on the web_demo.py context line
  is inferred -- TODO confirm against the original patch.
- The "From:" header carries no e-mail address in this copy; `git am` may
  reject the series for that reason -- confirm against the original mail.
- Dockerfile: `COPY . .` comes before the dependency install, so any source
  change invalidates the apt/pip/conda layers; `apt` is used without
  `--no-install-recommends` or list cleanup; no WORKDIR or USER is set.
  The diff content is left untouched so the hunks keep matching the
  recorded blob ids.

 Dockerfile  | 17 +++++++++++++++++
 web_demo.py |  2 +-
 2 files changed, 18 insertions(+), 1 deletion(-)
 create mode 100644 Dockerfile

diff --git a/Dockerfile b/Dockerfile
new file mode 100644
index 0000000..d99659e
--- /dev/null
+++ b/Dockerfile
@@ -0,0 +1,17 @@
+## use pytorch images
+FROM pytorch/pytorch:2.0.1-cuda11.7-cudnn8-runtime
+## copy all files
+COPY . .
+## install tools
+RUN apt update && apt install -y git gcc
+## install requirements and cudatoolkit
+RUN pip install -r requirements.txt -i https://pypi.tuna.tsinghua.edu.cn/simple/ && \
+pip install icetk -i https://pypi.tuna.tsinghua.edu.cn/simple/ && \
+conda install cudatoolkit=11.7 -c nvidia
+## expose port
+EXPOSE 7860
+## run
+CMD [ "python3","web_demo.py" ]
+
+## command for docker run
+## docker run --rm -it -v /path/to/chatglm2-6b-int4:/workspace/THUDM/chatglm2-6b --gpus=all -e NVIDIA_DRIVER_CAPABILITIES=compute,utility -e NVIDIA_VISIBLE_DEVICES=all -p 7860:7860 chatglm2:v1 python3 web_demo.py
\ No newline at end of file
diff --git a/web_demo.py b/web_demo.py
index 1af24c9..f019d1f 100644
--- a/web_demo.py
+++ b/web_demo.py
@@ -105,4 +105,4 @@ def reset_state():
 
     emptyBtn.click(reset_state, outputs=[chatbot, history, past_key_values], show_progress=True)
 
-demo.queue().launch(share=False, inbrowser=True)
+demo.queue().launch(share=False, inbrowser=True, server_name="0.0.0.0")

From b32ea6ce46aa2a78b7d038353a730265ec28439b Mon Sep 17 00:00:00 2001
From: dengsgo
Date: Sun, 2 Jul 2023 17:06:14 +0800
Subject: [PATCH 2/4] update docker run

---
Review notes (not part of the commit message):
- This replaces the generic `/path/to/...` host path in the usage comment
  with a user-specific `/home/dengsgo/models/...` path and drops the
  redundant trailing `python3 web_demo.py` (already the image CMD).

 Dockerfile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Dockerfile b/Dockerfile
index d99659e..15468f4 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -14,4 +14,4 @@ EXPOSE 7860
 CMD [ "python3","web_demo.py" ]
 
 ## command for docker run
-## docker run --rm -it -v /path/to/chatglm2-6b-int4:/workspace/THUDM/chatglm2-6b --gpus=all -e NVIDIA_DRIVER_CAPABILITIES=compute,utility -e NVIDIA_VISIBLE_DEVICES=all -p 7860:7860 chatglm2:v1 python3 web_demo.py
\ No newline at end of file
+## docker run --rm -it -v /home/dengsgo/models/chatglm2-6b-int4:/workspace/THUDM/chatglm2-6b --gpus=all -e NVIDIA_DRIVER_CAPABILITIES=compute,utility -e NVIDIA_VISIBLE_DEVICES=all -p 7860:7860 chatglm2:v1
\ No newline at end of file

From f80ab7e579f82668e158ce1b253e9e2b3d7953d7 Mon Sep 17 00:00:00 2001
From: dengsgo
Date: Sun, 2 Jul 2023 17:10:21 +0800
Subject: [PATCH 3/4] add label

---
Review notes (not part of the commit message):
- The added comment `## lables` is a typo for "labels"; it is kept as-is
  so the patch content stays identical to the recorded commit.

 Dockerfile | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/Dockerfile b/Dockerfile
index 15468f4..c09ff79 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -1,5 +1,9 @@
 ## use pytorch images
 FROM pytorch/pytorch:2.0.1-cuda11.7-cudnn8-runtime
+## lables
+LABEL version="v1"
+LABEL description="chatglm2-6b docker images"
+LABEL maintainer="dengsgo[https://github.com/dengsgo]"
 ## copy all files
 COPY . .
 ## install tools

From e36c12ad5664e5af16c9d5bb5eab556083a7d8e4 Mon Sep 17 00:00:00 2001
From: dengsgo
Date: Sun, 2 Jul 2023 17:40:00 +0800
Subject: [PATCH 4/4] add Docker webUI doc

---
Review notes (not part of the commit message):
- The README example mounts a user-specific host path
  (`/home/dengsgo/models/chatglm2-6b-int4`); readers must substitute their
  own model directory.
- Placement of the blank context lines in this hunk is inferred from the
  declared counts (6 old / 15 new) -- TODO confirm against README.md.

 README.md | 9 +++++++++
 1 file changed, 9 insertions(+)

diff --git a/README.md b/README.md
index cea2461..32831c8 100644
--- a/README.md
+++ b/README.md
@@ -131,6 +131,15 @@ cd ChatGLM2-6B
 
 然后使用 pip 安装依赖:`pip install -r requirements.txt`,其中 `transformers` 库版本推荐为 `4.30.2`,`torch` 推荐使用 2.0 以上的版本,以获得最佳的推理性能。
 
+### Docker webUI
+首先需要下载本仓库:
+```shell
+git clone https://github.com/THUDM/ChatGLM2-6B
+cd ChatGLM2-6B
+docker build -t chatglm2:v1 .
+docker run --rm -it -v /home/dengsgo/models/chatglm2-6b-int4:/workspace/THUDM/chatglm2-6b --gpus=all -e NVIDIA_DRIVER_CAPABILITIES=compute,utility -e NVIDIA_VISIBLE_DEVICES=all -p 7860:7860 chatglm2:v1
+```
+
 ### 代码调用
 
 可以通过如下代码调用 ChatGLM2-6B 模型来生成对话: