title: Docker搭建vicuna
tags: []
id: '2723'
categories:
项目地址:llama-cpp-python
镜像地址:hub-mirror
模型地址:ggml-vic13b-q5_1.bin
前端UI地址(目前仍不兼容):BetterChatGPT
# Docker Compose definition for a single llama-cpp-python API server.
# NOTE(review): the top-level `version` key is obsolete in the current Compose
# Specification; it is kept here only for compatibility with older tooling.
version: '3.3'
services:
  llama:
    ports:
      # host port 1234 -> container port 8000
      - '1234:8000'
    restart: always
    environment:
      # Same model file that is passed via --model in `command` below.
      MODEL: /models/ggml-vic13b-q5_1.bin
    volumes:
      # ./models (relative to this compose file) must contain the model file.
      - './models:/models'
    image: togettoyou/ghcr.io.abetlen.llama-cpp-python:latest
    command: ["python3", "-m", "llama_cpp.server", "--model", "/models/ggml-vic13b-q5_1.bin"]
服务启动后，可在浏览器中查看接口文档：http://localhost:1234/docs
# Send a one-message chat completion request to the server on host port 1234.
# The JSON payload lines are kept unindented so the request body is unchanged.
curl \
  --header 'Content-Type: application/json' \
  --data '{
"model": "gpt-3.5-turbo",
"messages": [{"role": "user", "content": "Hello!"}]
}' \
  http://localhost:1234/v1/chat/completions