ariG23498 HF staff committed on
Commit
b676ee0
·
1 Parent(s): 2ad3c12
Files changed (2) hide show
  1. Dockerfile +23 -0
  2. README.md +1 -0
Dockerfile ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Hugging Face TGI image, pinned to an explicit release tag
2
+ FROM ghcr.io/huggingface/text-generation-inference:3.0.2
3
+
4
+ # Set working directory
5
+ WORKDIR /app
6
+
7
+ # Create /data, /.cache and /.triton in one layer and make them world-writable.
8
+ # NOTE(review): presumably required because the container may run as a
9
+ # non-root user that has to write to these paths -- confirm, and narrow the
10
+ # mode (e.g. chown to a fixed UID) if the runtime user is known.
11
+ RUN mkdir -p /data /.cache /.triton \
12
+     && chmod 777 /data /.cache /.triton
13
+
14
+ # Document the listening port; matches --port below and app_port in README.md
15
+ EXPOSE 8080
16
+
17
+ # HF_TOKEN is deliberately NOT declared via ARG/ENV: build args and ENV values
18
+ # are recorded in the image config/history, which would leak the token.
19
+ # Provide it at runtime instead (e.g. `docker run -e HF_TOKEN=...`).
20
+
21
+ # Default arguments for the server (exec form, no shell expansion).
22
+ # NOTE(review): assumes the base image's ENTRYPOINT launches TGI -- confirm.
23
+ CMD ["--model-id", "allenai/OLMo-2-1124-7B-Instruct", "--port", "8080"]
README.md CHANGED
@@ -4,6 +4,7 @@ emoji: 👀
4
  colorFrom: green
5
  colorTo: red
6
  sdk: docker
 
7
  pinned: false
8
  short_description: TGI deployment of OLMo2
9
  ---
 
4
  colorFrom: green
5
  colorTo: red
6
  sdk: docker
7
+ app_port: 8080
8
  pinned: false
9
  short_description: TGI deployment of OLMo2
10
  ---