# Dockerfile
# Base image for the whole build.
# NOTE(review): 23.10 is an interim (non-LTS) Ubuntu release; confirm its
# package archive is still reachable before relying on `apt-get update`.
FROM ubuntu:23.10
# MAINTAINER is deprecated; the author is recorded as a standard OCI label.
# NOTE(review): the address appears redacted ("[email protected]") in this
# copy of the file; restore the real contact address if it is known.
LABEL org.opencontainers.image.authors="Darrell Ricke <[email protected]>"
################################################################################
# Author: Darrell O. Ricke, Ph.D. (email: [email protected])
#
# RAMS request ID 1028310
# RAMS title: Artificial Intelligence tools for Knowledge-Intensive Tasks (AIKIT)
#
# DISTRIBUTION STATEMENT A. Approved for public release. Distribution is unlimited.
#
# This material is based upon work supported by the Department of the Air Force
# under Air Force Contract No. FA8702-15-D-0001. Any opinions, findings,
# conclusions or recommendations expressed in this material are those of the
# author(s) and do not necessarily reflect the views of the Department of the Air Force.
#
# Copyright © 2024 Massachusetts Institute of Technology.
#
# Subject to FAR52.227-11 Patent Rights - Ownership by the contractor (May 2014)
#
# The software/firmware is provided to you on an As-Is basis
#
# Delivered to the U.S. Government with Unlimited Rights, as defined in DFARS
# Part 252.227-7013 or 7014 (Feb 2014). Notwithstanding any copyright notice,
# U.S. Government rights in this work are defined by DFARS 252.227-7013 or
# DFARS 252.227-7014 as detailed above. Use of this work other than as
# specifically authorized by the U.S. Government may violate any copyrights
# that exist in this work.
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
################################################################################
# Default locale for all later build steps and for the running container.
# Written in key=value form; the space-separated `ENV key value` form is legacy.
ENV LC_ALL=en_US.UTF-8 \
    LANG=en_US.UTF-8
# libcurl4-openssl-dev \
# Install the OS-level build toolchain, development libraries, language
# runtimes (Python, Ruby, Node.js, Java) and the Tesseract OCR packages.
#
# - `apt-get update` and the install share one RUN so the install can never
#   run against a stale, separately cached package index.
# - DEBIAN_FRONTEND=noninteractive is set inline (not via ENV) so package
#   configuration prompts cannot stall the unattended build, and the setting
#   does not leak into the runtime environment.
# - The package list is the de-duplicated union of the two original install
#   steps, one package per line and sorted, so diffs stay readable.
# - The apt package index is removed in the same layer that created it.
RUN apt-get update \
 && DEBIAN_FRONTEND=noninteractive apt-get install -y \
      bc \
      build-essential \
      bzip2 \
      coreutils \
      curl \
      default-jre \
      g++ \
      gcc \
      gfortran \
      git \
      gnupg2 \
      language-pack-en \
      language-pack-en-base \
      libbz2-dev \
      libcairo2-dev \
      libcurl4-nss-dev \
      libgit2-dev \
      libgtk2.0-dev \
      libleptonica-dev \
      liblzma-dev \
      libmysqlclient-dev \
      libncurses5-dev \
      libpcre3-dev \
      libpng-dev \
      libreadline-dev \
      libreadline6-dev \
      libsqlite3-dev \
      libssh2-1-dev \
      libssl-dev \
      libtesseract-dev \
      libyaml-dev \
      locales \
      make \
      nodejs \
      openssl \
      pigz \
      python3-dev \
      python3-pil \
      python3.11 \
      ruby-full \
      rubygems \
      sqlite3 \
      tabix \
      tesseract-ocr \
      tesseract-ocr-eng \
      tesseract-ocr-script-latn \
      unzip \
      vim \
      wget \
      xorg-dev \
      zip \
      zlib1g-dev \
 && rm -rf /var/lib/apt/lists/*
# /S is the build's scratch/application root; WORKDIR creates it if missing
# and makes it the working directory for the steps that follow.
WORKDIR /S
# Ruby gems needed by the Rails UI (database adapters, rake, timezone data,
# bundler and Rails itself).
RUN gem install \
      bundler \
      mysql2 \
      sqlite3 \
      rake \
      tzinfo-data \
      rails
# Bootstrap pip for the system python3 from the get-pip.py published under the
# pip/3.6 path.
# -f makes curl exit non-zero on an HTTP error instead of saving the error
# page as get-pip.py; -sS hides progress but still prints errors; -L follows
# redirects.
# NOTE(review): the 3.6-specific bootstrap script is kept on purpose. It
# presumably installs an older pip than the current get-pip.py would; confirm
# that is intentional before changing the URL, because the later
# `pip install` steps may depend on that pip's behavior.
RUN curl -fsSL https://bootstrap.pypa.io/pip/3.6/get-pip.py -o get-pip.py \
 && python3 get-pip.py
# COPY wgetrc /etc
WORKDIR /S
# Download the rustup installer over HTTPS (TLS 1.2+), make it executable and
# run it unattended (-y).
RUN curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs > sh.rustup.rs \
 && chmod +x sh.rustup.rs \
 && ./sh.rustup.rs -y
# Put cargo/rustc on PATH for later build steps and at runtime.
# ENV performs no shell tilde expansion, so "~/.cargo/bin" would be stored
# literally and never match a real directory. No USER instruction precedes
# this point, so the build runs as root and rustup's default install location
# is /root/.cargo.
ENV PATH=/root/.cargo/bin:$PATH
# Python dependencies for the LLM tooling.
# --no-cache-dir keeps pip's download cache out of the image layers.
# The individual pip invocations and their order are preserved, because each
# invocation resolves dependencies on its own and the order can affect which
# versions end up installed.
COPY llms_requirements.txt /S
RUN pip install --no-cache-dir -r llms_requirements.txt

# llama.cpp Python bindings plus the web-serving stack.
RUN pip install --no-cache-dir llama-cpp-python \
 && pip install --no-cache-dir fastapi uvicorn sse-starlette requests

RUN pip install --no-cache-dir numba

# Transformers, Gradio and the LangChain family.
# NOTE(review): langchain-community and langchain-core are pinned to 0.2.1,
# but the unpinned installs that follow may move langchain-core to a newer
# version; confirm the resulting set is the intended one.
RUN pip install --no-cache-dir transformers \
 && pip install --no-cache-dir gradio \
 && pip install --no-cache-dir langchain-community==0.2.1 langchain-core==0.2.1 \
 && pip install --no-cache-dir langchain \
 && pip install --no-cache-dir "langserve[all]" \
 && pip install --no-cache-dir langchain_openai \
 && pip install --no-cache-dir langchainhub \
 && pip install --no-cache-dir langgraph \
 && pip install --no-cache-dir scipy \
 && pip install --no-cache-dir einops \
 && pip install --no-cache-dir bitsandbytes
# Fetch the facebookresearch/llama sources into /S/llama and install the
# package from that checkout. The working directory is left at /S.
RUN git clone https://github.com/facebookresearch/llama.git /S/llama \
 && pip install /S/llama
# Register NVIDIA's libnvidia-container apt repository and install
# nvidia-container-toolkit from it.
#
# - Each download goes to a temporary file instead of being piped, so a failed
#   curl aborts the build; under the default /bin/sh a pipeline only reports
#   the exit status of its last command.
# - Both curl calls use -f so an HTTP error is a failure, not saved content.
# - The sed expression adds the signed-by keyring option to every
#   "deb https://" entry of the downloaded source list.
# - `apt-get update` and the install share one layer so the install cannot use
#   a stale cached index; the index is removed afterwards in the same layer.
RUN curl -fsSL https://nvidia.github.io/libnvidia-container/gpgkey -o /tmp/nvidia-gpgkey \
 && gpg --dearmor --no-tty -o /usr/share/keyrings/nvidia-container-toolkit-keyring.gpg /tmp/nvidia-gpgkey \
 && curl -fsSL https://nvidia.github.io/libnvidia-container/stable/deb/nvidia-container-toolkit.list -o /tmp/nvidia-container-toolkit.list \
 && sed 's#deb https://#deb [signed-by=/usr/share/keyrings/nvidia-container-toolkit-keyring.gpg] https://#g' \
      /tmp/nvidia-container-toolkit.list > /etc/apt/sources.list.d/nvidia-container-toolkit.list \
 && rm -f /tmp/nvidia-gpgkey /tmp/nvidia-container-toolkit.list \
 && apt-get update \
 && DEBIAN_FRONTEND=noninteractive apt-get install -y nvidia-container-toolkit \
 && rm -rf /var/lib/apt/lists/*
# Retrieval, dataset and document-processing packages.
# --no-cache-dir keeps pip's download cache out of the image layers.
# "pypdf[crypto]" is quoted so the shell can never treat the brackets as a
# glob pattern.
RUN pip install --no-cache-dir build \
 && pip install --no-cache-dir chromadb \
 && pip install --no-cache-dir datasets \
 && pip install --no-cache-dir faiss-cpu \
 && pip install --no-cache-dir langchain-chroma \
 && pip install --no-cache-dir langchain_mistralai \
 && pip install --no-cache-dir peft \
 && pip install --no-cache-dir pettingzoo \
 && pip install --no-cache-dir pypdf \
 && pip install --no-cache-dir "pypdf[crypto]"

# Deep-learning frameworks, tokenizers, training helpers and OCR bindings.
# NOTE(review): `docx` and `python-docx` are different PyPI projects that both
# provide a `docx` module; confirm `docx` is the one intended here.
RUN pip install --no-cache-dir sentence-transformers \
 && pip install --no-cache-dir tensorflow \
 && pip install --no-cache-dir tokenizers \
 && pip install --no-cache-dir torch \
 && pip install --no-cache-dir tqdm \
 && pip install --no-cache-dir trl \
 && pip install --no-cache-dir "unstructured[all-docs]" \
 && pip install --no-cache-dir docx \
 && pip install --no-cache-dir "transformers[sentencepiece]" \
 && pip install --no-cache-dir langchain-huggingface \
 && pip install --no-cache-dir pytesseract \
 && pip install --no-cache-dir tf-keras \
 && pip install --no-cache-dir tensorrt

# Upgrade accelerate last so nothing installed above holds it back.
RUN pip install --no-cache-dir accelerate --upgrade
# Continue working in /S.
WORKDIR /S
# Point the HF_* cache variables at /io (presumably read by the Hugging Face
# libraries installed earlier; /io is also the final working directory).
ENV HF_HOME=/io \
    HF_HUB_CACHE=/io/hub \
    HF_ASSETS_CACHE=/io/assets
# Unpack the Rails UI into /S.
# ADD auto-extracts a local tar archive, so the tarball itself is not kept in
# an image layer the way COPY followed by `tar -xf` keeps it.
# NOTE(review): /S/AIKIT_UI.tar no longer exists in the image after this
# change; confirm entrypoint.sh or other tooling does not expect it.
# The archive is expected to contain a top-level AIKIT_UI directory, as the
# WORKDIR below requires.
ADD AIKIT_UI.tar /S/
# COPY AIKIT_UI /S
WORKDIR /S/AIKIT_UI
# Resolve and install the application's gems.
# NOTE(review): `bundle update` re-resolves gem versions on every build;
# `bundle install` would honour a Gemfile.lock if one is shipped. Confirm
# which behavior is wanted.
RUN bundle update
# RUN rails db:migrate VERSION=0
# Apply the database migrations at build time.
RUN rails db:migrate
# Precompile the asset pipeline for both environments.
RUN bundle exec rake assets:precompile RAILS_ENV=development
RUN bundle exec rake assets:precompile RAILS_ENV=production
# Runtime working directory.
WORKDIR /io
# ENV TRANSFORMERS_OFFLINE="1"
# ENV HF_DATASETS_OFFLINE="1"
# ENV HF_HUB_OFFLINE="1"
ENV SENTENCE_TRANSFORMERS_HOME=/io/Sentences
# Install the entrypoint script in both /usr/bin and /usr/local/bin and mark
# both copies executable; ENTRYPOINT then finds it by name through PATH.
COPY entrypoint.sh /usr/bin
COPY entrypoint.sh /usr/local/bin
RUN chmod +x /usr/bin/entrypoint.sh /usr/local/bin/entrypoint.sh
ENTRYPOINT ["entrypoint.sh"]
# Ports the container is expected to listen on (documentation only; they
# still have to be published at `docker run` time).
EXPOSE 3000 7860 8888