zhijian's picture
Update Dockerfile
6a12082
raw
history blame contribute delete
No virus
497 Bytes
# Base image: the full (non-slim) Python 3.8 image.
FROM python:3.8

# System packages: a Java JDK/JRE and git (git is required by the pip VCS
# install below). update, install, and list cleanup share a single layer so
# the package index is never stale and is not shipped in the image.
# --no-install-recommends keeps optional extras out of the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        default-jdk \
        default-jre \
        git \
    && rm -rf /var/lib/apt/lists/*

# Point Java tooling at the distribution's default Java installation.
ENV JAVA_HOME=/usr/lib/jvm/default-java

# Install data-juicer with all extras directly from the upstream repository.
# --no-cache-dir keeps pip's download cache out of the layer.
RUN pip install --no-cache-dir "py-data-juicer[all] @ git+https://github.com/alibaba/data-juicer.git"

# Runs after the data-juicer install so this exact fsspec version replaces
# whichever one the previous step resolved.
# NOTE(review): presumably a compatibility pin — confirm it is still needed.
RUN pip install --no-cache-dir fsspec==2023.3.0
# Create an unprivileged user (UID 1000) with a home directory and run every
# following instruction, and the container itself, as that user.
RUN useradd -m -u 1000 dj
USER dj
ENV HOME=/home/dj

# Clone the repository straight into the user's home directory. The clone runs
# as dj, so the checkout is already owned by dj and needs no follow-up chown.
RUN git clone https://github.com/alibaba/data-juicer.git "$HOME/data-juicer"

# Start in the demo's directory so the relative app.py path below resolves.
WORKDIR $HOME/data-juicer/demos/tool_dataset_splitting_by_language

# Exec form: streamlit is started directly, without a wrapping shell.
CMD ["streamlit", "run", "app.py"]