This repository has been archived by the owner on Mar 29, 2024. It is now read-only.
forked from patil-suraj/wav2vec2-sprint
-
Notifications
You must be signed in to change notification settings - Fork 9
/
Copy pathDockerfile
56 lines (45 loc) · 1.52 KB
/
Dockerfile
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
FROM ovhcom/ai-training-one-for-all
RUN apt-get update && \
apt install -y bash \
build-essential \
libsndfile1-dev \
git-lfs \
sox
RUN python3 -m pip install --no-cache-dir --upgrade pip && \
python3 -m pip install --no-cache-dir \
datasets \
jiwer==2.2.0 \
soundfile \
torchaudio \
lang-trans==0.6.0 \
librosa==0.8.0
RUN pip3 uninstall -y typing allennlp
RUN pip3 install git+https://github.com/huggingface/transformers.git
RUN mkdir -p /workspace/wav2vec/
COPY fine-tune-xlsr-wav2vec2-on-turkish-asr-with-transformers.ipynb finetune.sh run_common_voice.py finetune_with_params.sh /workspace/wav2vec/
COPY home-server.html run_all.sh /usr/bin/
RUN chown -R 42420:42420 /workspace
RUN chown -R 42420:42420 /usr/bin/run_all.sh
#Default training env variables
ENV model_name_or_path="facebook/wav2vec2-large-xlsr-53" \
dataset_config_name="fr" \
output_dir="/workspace/output_models/wav2vec2-large-xlsr-french-demo" \
cache_dir="/workspace/data" \
num_train_epochs="1" \
per_device_train_batch_size="32" \
per_device_eval_batch_size="32" \
evaluation_strategy="steps" \
learning_rate="3e-4" \
warmup_steps="500" \
save_steps="10" \
eval_steps="10" \
save_total_limit="1" \
logging_steps="10" \
feat_proj_dropout="0.0" \
layerdrop="0.1" \
max_train_samples=100 \
max_val_samples=100
WORKDIR /workspace
ENTRYPOINT []
#CMD ["sh", "/usr/bin/run_all.sh"]
CMD ["supervisord", "-n", "-u", "42420", "-c", "/etc/supervisor/supervisor.conf"]