init🎉:
This commit is contained in:
		
							
								
								
									
										2
									
								
								.gitignore
									
									
									
									
										vendored
									
									
										Normal file
									
								
							
							
						
						
									
										2
									
								
								.gitignore
									
									
									
									
										vendored
									
									
										Normal file
									
								
							| @ -0,0 +1,2 @@ | ||||
| # Directories excluded from version control. | ||||
| tests/ | ||||
| qwen_deploy/ | ||||
							
								
								
									
										31
									
								
								docker/Dockerfile
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										31
									
								
								docker/Dockerfile
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,31 @@ | ||||
| # Image that installs flash-attn plus the packages listed in requirements.txt | ||||
| # on top of the PyTorch CUDA devel image, then runs /workspace/start.sh. | ||||
| # start.sh is NOT copied into the image by this file; it must be provided at | ||||
| # runtime (for example via a bind mount) or the default CMD will fail. | ||||
| FROM pytorch/pytorch:2.1.2-cuda12.1-cudnn8-devel | ||||
|  | ||||
| # Build-time knobs: | ||||
| #   PIP_SOURCE - package index used for the requirements.txt install | ||||
| #   BUILD_TMP  - scratch directory used only while building | ||||
| ARG PIP_SOURCE=https://pypi.tuna.tsinghua.edu.cn/simple | ||||
| ARG BUILD_TMP=/build_tmp | ||||
|  | ||||
| RUN mkdir $BUILD_TMP | ||||
|  | ||||
| # install basic dependencies | ||||
| # The image's apt sources are replaced with the sources.list from the build context. | ||||
| # NOTE(review): confirm the Ubuntu release named in sources.list matches this base image. | ||||
| COPY sources.list /etc/apt/sources.list | ||||
| RUN apt-get clean all && apt-get update && apt-get install -y --no-install-recommends \ | ||||
|     python3.8 \ | ||||
|     git \ | ||||
|     curl \ | ||||
|     wget | ||||
|  | ||||
| # install python requirements | ||||
| # flash-attn is installed on its own, with build isolation disabled, before the rest. | ||||
| RUN pip install flash-attn==2.4.2 --no-build-isolation | ||||
|  | ||||
| COPY requirements.txt $BUILD_TMP/. | ||||
| RUN pip install -i $PIP_SOURCE -r $BUILD_TMP/requirements.txt | ||||
|  | ||||
| # set locale | ||||
| # Use the key=value form for every variable: the legacy "ENV KEY value" form | ||||
| # treats the whole remainder of the line as the value of a single variable, | ||||
| # which would set LANG to "C.UTF-8 LC_ALL=C.UTF-8" and leave LC_ALL unset. | ||||
| ENV LANG=C.UTF-8 LC_ALL=C.UTF-8 | ||||
|  | ||||
| # clean up | ||||
| RUN rm -rf $BUILD_TMP | ||||
|  | ||||
| # initialize workspace | ||||
| WORKDIR /workspace | ||||
|  | ||||
| # Default command: run the startup script expected at /workspace/start.sh. | ||||
| CMD ["/bin/bash", "/workspace/start.sh"] | ||||
							
								
								
									
										24
									
								
								docker/docker-compose.yml
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										24
									
								
								docker/docker-compose.yml
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,24 @@ | ||||
| # Compose definition for a single "api_server" service built from this directory. | ||||
| # The values under "environment" are consumed by start.sh, which is bind-mounted | ||||
| # into the container at /workspace/start.sh. | ||||
| version: "3" | ||||
| services: | ||||
|     api_server: | ||||
|         build: . | ||||
|         restart: unless-stopped | ||||
|         # the container shares the host network stack, so HOST/PORT below are host addresses | ||||
|         network_mode: host | ||||
|         volumes: | ||||
|             - ./start.sh:/workspace/start.sh | ||||
|             # Host directory that holds all your models: set MODELS_PATH in the | ||||
|             # environment (or a .env file), or edit the default after ":-". | ||||
|             # The source must be a path (starting with "./" or "/"); a bare name | ||||
|             # is parsed as a named volume, which this file does not declare. | ||||
|             - ${MODELS_PATH:-./models}:/workspace/models # "models" contains multiple models | ||||
|         environment: | ||||
|             # change "main" to your model name | ||||
|             - MODEL_PATH=/workspace/models/main | ||||
|             - MAX_MODEL_LEN=4096  # max model input length | ||||
|             - HOST=127.0.0.1 | ||||
|             - PORT=9001  # change to your port | ||||
|             - API_KEY=token-123456  # change to your api key for security | ||||
|         deploy: | ||||
|             resources: | ||||
|                 reservations: | ||||
|                     devices: | ||||
|                         - driver: "nvidia" | ||||
|                           device_ids: ['0']  # gpu id, change to your gpu id | ||||
|                           capabilities: ["gpu"] | ||||
							
								
								
									
										3
									
								
								docker/requirements.txt
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										3
									
								
								docker/requirements.txt
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,3 @@ | ||||
| # Pinned Python packages; the Dockerfile copies this file into the image and installs it with "pip install -r". | ||||
| accelerate==0.28.0 | ||||
| vllm==0.4.0.post1 | ||||
| openai==1.16.1 | ||||
							
								
								
									
										13
									
								
								docker/sources.list
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										13
									
								
								docker/sources.list
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,13 @@ | ||||
| # The source-package (deb-src) mirrors are commented out by default to speed up apt update; uncomment them if needed. | ||||
| # NOTE(review): every entry targets the Ubuntu "focal" release - confirm this matches the release of the image this file is copied into. | ||||
| deb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ focal main restricted universe multiverse | ||||
| # deb-src https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ focal main restricted universe multiverse | ||||
| deb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ focal-updates main restricted universe multiverse | ||||
| # deb-src https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ focal-updates main restricted universe multiverse | ||||
| deb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ focal-backports main restricted universe multiverse | ||||
| # deb-src https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ focal-backports main restricted universe multiverse | ||||
| deb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ focal-security main restricted universe multiverse | ||||
| # deb-src https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ focal-security main restricted universe multiverse | ||||
|  | ||||
| # Pre-release (proposed) package source; enabling it is not recommended. | ||||
| # deb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ focal-proposed main restricted universe multiverse | ||||
| # deb-src https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ focal-proposed main restricted universe multiverse | ||||
							
								
								
									
										1
									
								
								docker/start.sh
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										1
									
								
								docker/start.sh
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1 @@ | ||||
| # Start the vLLM OpenAI-compatible API server using settings from the environment. | ||||
| # Required variables: MODEL_PATH, MAX_MODEL_LEN, HOST, PORT, API_KEY. | ||||
| # Each expansion uses ${VAR:?} so an unset or empty value aborts with a clear | ||||
| # message, and is quoted so values containing spaces stay a single argument. | ||||
| # "exec" replaces the shell with the server process, so signals sent to the | ||||
| # container's main process reach the server instead of a wrapping bash. | ||||
| exec python -m vllm.entrypoints.openai.api_server --dtype bfloat16 --model "${MODEL_PATH:?MODEL_PATH must be set}" --max-model-len "${MAX_MODEL_LEN:?MAX_MODEL_LEN must be set}" --host "${HOST:?HOST must be set}" --port "${PORT:?PORT must be set}" --api-key "${API_KEY:?API_KEY must be set}" | ||||
		Reference in New Issue
	
	Block a user