Bushra-KB committed on
Commit
ef48146
·
verified ·
1 Parent(s): 95141bb

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +7 -3
Dockerfile CHANGED
@@ -1,4 +1,4 @@
1
- FROM python:3.12-slim
2
 
3
  # Set environment variables for caching to a writable directory
4
  # These will be used by huggingface libraries to store models and other assets.
@@ -11,11 +11,15 @@ ENV HF_DATASETS_CACHE=/data/huggingface/datasets
11
  RUN mkdir -p $TRANSFORMERS_CACHE $HF_DATASETS_CACHE $TORCH_HOME && \
12
  chmod -R 777 /data
13
 
14
- # System deps for soundfile and audio encoding
15
  RUN apt-get update && apt-get install -y --no-install-recommends \
16
- libsndfile1 ffmpeg git && \
17
  rm -rf /var/lib/apt/lists/*
18
 
 
 
 
 
19
  WORKDIR /app
20
 
21
  # Install Python deps
 
1
+ FROM python:3.14-slim
2
 
3
  # Set environment variables for caching to a writable directory
4
  # These will be used by huggingface libraries to store models and other assets.
 
11
  RUN mkdir -p $TRANSFORMERS_CACHE $HF_DATASETS_CACHE $TORCH_HOME && \
12
  chmod -R 777 /data
13
 
14
+ # System deps for soundfile, audio encoding, and uroman
15
  RUN apt-get update && apt-get install -y --no-install-recommends \
16
+ libsndfile1 ffmpeg git perl && \
17
  rm -rf /var/lib/apt/lists/*
18
 
19
+ # Clone and install uroman from source so the tokenizer can find it
20
+ RUN git clone https://github.com/isi-nlp/uroman.git /opt/uroman && \
21
+ ln -s /opt/uroman/bin/uroman.pl /usr/local/bin/uroman
22
+
23
  WORKDIR /app
24
 
25
  # Install Python deps