-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathDockerfile.cuda
41 lines (32 loc) · 971 Bytes
/
Dockerfile.cuda
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
# Base image: PyTorch 2.2.2 runtime with CUDA 12.1 and cuDNN 8.
FROM pytorch/pytorch:2.2.2-cuda12.1-cudnn8-runtime

# Application home; WORKDIR creates the directory if it does not exist and
# makes the relative paths below resolve against /app.
WORKDIR /app

# Install Python dependencies BEFORE copying the application source so that
# source-only changes reuse these cached layers instead of reinstalling.
# --no-cache-dir keeps pip's download cache out of the image layers.
# NOTE(review): transformers is installed unpinned; pin a version (here or in
# requirements.txt) for reproducible builds.
RUN pip install --no-cache-dir transformers
COPY requirements.txt /app/
RUN pip install --no-cache-dir -r requirements.txt

# Copy the contents of src/ into /app. COPY is used rather than ADD because
# neither archive auto-extraction nor remote fetching is needed here.
COPY src /app
# Runtime configuration defaults. Every value below can be overridden when
# the container is started (e.g. `docker run -e NAME=value`).

# Generic configuration: API keys default to the empty string.
ENV OPENAI_API_KEY="" \
    NLP_CLOUD_API_KEY=""

# Pool configuration: address and port of the pool endpoint.
ENV POOL_ADDRESS="127.0.0.1" \
    POOL_PORT="5000"

# Embeddings configuration.
# NOTE(review): EMBEDDINGS_TRANSFORMERS_DEVICE is "-1" although this is the
# CUDA image; presumably -1 selects CPU and a GPU index (e.g. 0) is expected
# to be passed at run time -- confirm against the application code.
# NOTE(review): "hugginface" in EMBEDDINGS_HF_HOME looks like a typo of
# "huggingface"; left unchanged because renaming the path would orphan
# caches already stored on existing volumes.
ENV EMBEDDINGS_TRANSFORMERS_DEVICE="-1" \
    EMBEDDINGS_CACHE_PATH="/cache" \
    EMBEDDINGS_HF_HOME="/cache/hugginface" \
    EMBEDDINGS_MODEL="intfloat/multilingual-e5-base" \
    EMBEDDINGS_MAX_TEXT_LENGTH=512 \
    EMBEDDINGS_ADD_MARKERS_TO_SENTENCES="true"

# Logging configuration: application log level plus OpenObserve settings.
ENV LOG_LEVEL="debug" \
    OPENOBSERVE_ENDPOINT="" \
    OPENOBSERVE_ORG="default" \
    OPENOBSERVE_STREAM="default" \
    OPENOBSERVE_BASICAUTH="" \
    OPENOBSERVE_USERNAME="" \
    OPENOBSERVE_PASSWORD="" \
    OPENOBSERVE_BATCHSIZE="21" \
    OPENOBSERVE_FLUSH_INTERVAL="5000" \
    OPENOBSERVE_LOG_LEVEL="debug"
# Declare /cache as a volume mount point so data written there lives
# outside the container's writable layer.
VOLUME ["/cache"]

# Start the application in exec form (no wrapping shell); -u makes Python's
# stdout/stderr unbuffered so log lines appear immediately.
CMD ["python", "-u", "main.py"]