forked from mozilla/DeepSpeech
-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathDockerfile.train.tmpl
61 lines (53 loc) · 2.24 KB
/
Dockerfile.train.tmpl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
# Please refer to the TRAINING documentation, "Basic Dockerfile for training"
FROM tensorflow/tensorflow:1.15.4-gpu-py3
ENV DEBIAN_FRONTEND=noninteractive \
DEEPSPEECH_REPO=#DEEPSPEECH_REPO# \
DEEPSPEECH_SHA=#DEEPSPEECH_SHA#
RUN apt-get update && apt-get install -y --no-install-recommends \
apt-utils \
bash-completion \
build-essential \
cmake \
curl \
git \
libboost-all-dev \
libbz2-dev \
liblzma-dev \
locales \
python3-venv \
unzip \
xz-utils \
wget && \
# We need to remove it because it's breaking deepspeech install later with \
# weird errors about setuptools \
apt-get purge -y python3-xdg && \
# Install dependencies for audio augmentation \
apt-get install -y --no-install-recommends libopus0 libsndfile1 && \
# Try and free some space \
rm -rf /var/lib/apt/lists/*
WORKDIR /
RUN git clone $DEEPSPEECH_REPO DeepSpeech && \
cd /DeepSpeech && git fetch origin $DEEPSPEECH_SHA && git checkout $DEEPSPEECH_SHA && \
git submodule sync kenlm/ && git submodule update --init kenlm/
# Build CTC decoder first, to avoid clashes on incompatible versions upgrades
RUN cd /DeepSpeech/native_client/ctcdecode && make NUM_PROCESSES=$(nproc) bindings && \
pip3 install --upgrade dist/*.whl
# Prepare deps
RUN cd /DeepSpeech && pip3 install --upgrade pip==20.2.2 wheel==0.34.2 setuptools==49.6.0 && \
# Install DeepSpeech \
# - No need for the decoder since we did it earlier \
# - There is already correct TensorFlow GPU installed on the base image, \
# we don't want to break that \
DS_NODECODER=y DS_NOTENSORFLOW=y pip3 install --upgrade -e . && \
# Tool to convert output graph for inference \
curl -vsSL https://github.com/mozilla/DeepSpeech/releases/download/v0.9.3/linux.amd64.convert_graphdef_memmapped_format.xz | xz -d > convert_graphdef_memmapped_format && \
chmod +x convert_graphdef_memmapped_format
# Build KenLM to generate new scorers
WORKDIR /DeepSpeech/kenlm
RUN wget -O - https://gitlab.com/libeigen/eigen/-/archive/3.3.8/eigen-3.3.8.tar.bz2 | tar xj && \
mkdir -p build && \
cd build && \
EIGEN3_ROOT=/DeepSpeech/kenlm/eigen-3.3.8 cmake .. && \
make -j $(nproc)
WORKDIR /DeepSpeech
RUN ./bin/run-ldc93s1.sh