Skip to content

Commit

Permalink
add punkt
Browse files Browse the repository at this point in the history
  • Loading branch information
AlisoSouza committed Mar 8, 2024
1 parent bc29ee8 commit dcbf047
Showing 1 changed file with 8 additions and 1 deletion.
9 changes: 8 additions & 1 deletion Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -9,9 +9,16 @@ COPY pyproject.toml poetry.lock ./
# Install the project's non-dev dependencies with Poetry. Virtualenv creation
# is switched off first, so packages are installed into the image's own Python
# environment rather than a Poetry-managed venv.
# NOTE(review): `--no-dev` is deprecated on Poetry >= 1.2 (replaced by
# `--without dev` / `--only main`) — confirm the Poetry version pinned earlier
# in this file before changing it.
RUN poetry config virtualenvs.create false \
    && poetry install --no-dev

# System packages needed by the rest of the build and by the application:
#   - libmagic1: the native libmagic library used by python-magic
#   - curl, unzip: used by the NLTK punkt download step below
#   - ca-certificates: listed explicitly because --no-install-recommends would
#     otherwise skip it, and curl needs it to verify HTTPS downloads
# `apt-get update` and `apt-get install` share a single layer so a cached,
# stale package index is never reused, and the index is deleted in that same
# layer so it does not add to the image size. `apt-get` is used instead of
# `apt`, whose CLI is not intended for scripts.
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        ca-certificates \
        curl \
        libmagic1 \
        unzip && \
    rm -rf /var/lib/apt/lists/*

# NOTE(review): `poetry add` resolves an unpinned python-magic at build time
# and edits pyproject.toml / poetry.lock only inside the image. Consider
# declaring python-magic in pyproject.toml so the lock file pins it.
RUN poetry add python-magic

# Download the NLTK "punkt" tokenizer data and unpack it to
# /nltk_data/tokenizers/punkt.
# Everything happens in one layer so the temporary archive is deleted in the
# same layer that created it and never ends up in the image.
#   - curl -f: fail the build on an HTTP error instead of saving the error page
#   - curl -sSL: quiet output, still print errors, follow redirects
#   - mkdir -p: also keeps the (empty) ./nltk_data directory that the previous
#     version of this step created in the working directory
# NOTE(review): the URL tracks the gh-pages branch, so the archive is not
# pinned; consider pinning a commit and verifying a checksum.
# NOTE(review): NLTK will only look in /nltk_data if NLTK_DATA (or an
# equivalent nltk.data.path entry) points there — confirm that is configured.
RUN mkdir -p nltk_data /nltk_data/tokenizers && \
    curl -fsSL --output /tmp/punkt.zip \
        https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/packages/tokenizers/punkt.zip && \
    unzip -q /tmp/punkt.zip -d /nltk_data/tokenizers/ && \
    rm /tmp/punkt.zip

# Copy the whole build context into the image's current working directory.
# This comes after the dependency and data steps above so that source-only
# changes do not invalidate those cached layers.
COPY . .

# Document that the container listens on port 8000. EXPOSE is metadata only
# and does not publish the port.
EXPOSE 8000
Expand Down

0 comments on commit dcbf047

Please sign in to comment.