VladTruTru committed on
Commit
50ff487
·
verified ·
1 Parent(s): ef62f24
Files changed (1) hide show
  1. Dockerfile +19 -7
Dockerfile CHANGED
@@ -2,16 +2,28 @@
2
  # you will also find guides on how best to write your Dockerfile
3
 
4
  # FROM python:3.9
5
- FROM ollama:0.1.44
6
 
7
- RUN useradd -m -u 1000 user
8
- USER user
9
- ENV PATH="/home/user/.local/bin:$PATH"
10
 
11
  WORKDIR /app
12
 
13
- COPY --chown=user ./requirements.txt requirements.txt
14
- RUN pip install --no-cache-dir --upgrade -r requirements.txt
 
 
15
 
16
  COPY --chown=user . /app
17
- CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
 
 
 
 
 
 
 
 
 
 
 
2
  # you will also find guides on how best to write your Dockerfile
3
 
4
  # FROM python:3.9
5
+ FROM ollama/ollama:0.12.1-rc0
6
 
7
+ # RUN useradd -m -u 1000 ollama
8
+ # USER user
9
+ # ENV PATH="/home/user/.local/bin:$PATH"
10
 
11
  WORKDIR /app
12
 
13
+ # COPY --chown=user ./requirements.txt requirements.txt
14
+ # RUN pip install --no-cache-dir --upgrade -r requirements.txt
15
+
16
+ RUN which ollama
17
 
18
  COPY --chown=user . /app
19
+ RUN ls -alh ./
20
+ # Override the entrypoint to run app.py (the vLLM server arguments below are commented out)
21
+ ENTRYPOINT ["python3", "./app.py"]
22
+ # , "&&",\
23
+ # "python3", "-m", "vllm.entrypoints.openai.api_server", \
24
+ # "--model", "Qwen/Qwen3-8B", \
25
+ # "--host", "0.0.0.0", \
26
+ # "--port", "7860", \
27
+ # "--tensor-parallel-size", "4", \
28
+ # "--trust-remote-code" ]
29
+ # # CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]