Skip to content

Commit a01d523

Browse files
committed
add produce training data dockerfile
1 parent e5bc4ba commit a01d523

File tree

1 file changed

+38
-0
lines changed

1 file changed

+38
-0
lines changed

image-build-process/Dockerfile

Lines changed: 38 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,38 @@
1+
# Base image: Python 3.7 (the default, non-slim tag of the `python` image).
# NOTE(review): the `git clone` step further down relies on git already being
# available in this image; no visible step in this file installs it.
FROM python:3.7
2+
3+
4+
# Install system packages: ffmpeg, libsm6, libxext6.
# (Presumably runtime libraries for the Python dependencies installed later;
# confirm against ocr_data_generator's requirements.txt.)
#
# `apt-get update` and `apt-get install` run in the same RUN instruction so the
# install can never reuse a stale, separately cached package index.
# `--no-install-recommends` keeps optional packages out of the image, and the
# package lists are removed in the same layer so they do not add to its size.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ffmpeg \
        libsm6 \
        libxext6 \
    && rm -rf /var/lib/apt/lists/*
6+
# ENV LANG=en_US.utf8
7+
# ENV LANG=C.UTF-8
8+
9+
# ENV PYTHONUNBUFFERED=TRUE
10+
# ENV PYTHONDONTWRITEBYTECODE=TRUE
11+
# ENV PATH="/opt/program:${PATH}"
12+
13+
# RUN pip3 install --upgrade pip
14+
15+
# ## install paddlepaddle framework
16+
# RUN pip3 install paddlepaddle-gpu -i https://mirror.baidu.com/pypi/simple
17+
# RUN pip3 install paddleocr==2.0.1
18+
19+
# ## clone PaddleOCR source code
20+
# RUN git clone -b release/2.1 https://github.com/PaddlePaddle/PaddleOCR.git /opt/program/
21+
22+
23+
# # download pretrained model for fine-tuning
24+
# RUN mkdir /opt/program/pretrain/
25+
# RUN cd /opt/program/pretrain/
26+
# RUN wget -P /opt/program/pretrain/ https://paddleocr.bj.bcebos.com/dygraph_v2.0/ch/ch_ppocr_mobile_v2.0_rec_train.tar && tar -xf /opt/program/pretrain/ch_ppocr_mobile_v2.0_rec_train.tar -C /opt/program/pretrain/ && rm -rf /opt/program/pretrain/ch_ppocr_mobile_v2.0_rec_train.tar
27+
28+
# Set up the program in the image
29+
# Fetch the data-generator sources into ./ocr_data_generator (relative to the
# current working directory of the build).
# `--depth 1` fetches only the latest commit, so the repository history is not
# stored in the image layer.
# NOTE(review): this clones whatever the default branch points to at build
# time; pin a tag or commit if reproducible builds are required.
RUN git clone --depth 1 https://github.com/catwhiskers/ocr_data_generator.git
30+
31+
#WORKDIR /opt/program
32+
# Install the generator's Python dependencies and run the data generation at
# build time, so whatever generate_data.py writes ends up in this image layer.
# `--no-cache-dir` stops pip from leaving its download cache in the layer.
# `cd` is used inside the RUN (rather than WORKDIR) so the image's working
# directory for later instructions and at runtime stays unchanged.
# NOTE(review): the meaning of the arguments `seto_font train data/ZH_1.txt
# setofont` is defined by generate_data.py in the cloned repo; verify there.
RUN cd ./ocr_data_generator \
    && pip install --no-cache-dir -r requirements.txt \
    && python generate_data.py seto_font train data/ZH_1.txt setofont
33+
34+
35+
# ENTRYPOINT ["python3", "train.py"]
36+
37+
38+

0 commit comments

Comments
 (0)