lollms-webui is a web interface for hosting Large Language Models (LLMs) using many different models and bindings.
This Dockerfile installs lollms and lollms-webui as libraries in a Docker image.
The Dockerfile is based on nvidia/cuda with Ubuntu and cuDNN. It should be used with the NVIDIA Container Toolkit to enable GPU support in Docker.
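To check that the NVIDIA Container Toolkit is working before building, you can run nvidia-smi inside a CUDA base image (the exact image tag below is only an example):
docker run --rm --gpus all nvidia/cuda:12.2.0-base-ubuntu22.04 nvidia-smi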
Build the image locally:
docker build -t lollms-webui:0.0.1 .
When rebuilding, remember to clean up the build cache so that the latest git versions of lollms and lollms-webui are fetched.
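For example, either of the following forces a fresh fetch on the next build (both are standard Docker commands):
docker builder prune
docker build --no-cache -t lollms-webui:0.0.1 .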
Create a cache directory:
mkdir -p ~/.cache/lollms
It will be used for storing LLMs and configuration files.
Download a model supporting the new (as of June 2023) k-quant methods in llama.cpp and place it in the cache directory ~/.cache/lollms/models/llama_cpp_official/.
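For example, assuming the model was downloaded to ~/Downloads (the filename below is hypothetical):
mkdir -p ~/.cache/lollms/models/llama_cpp_official
mv ~/Downloads/some-model.q4_K_M.bin ~/.cache/lollms/models/llama_cpp_official/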
Run the container:
docker run --rm -it --gpus all -v ~/.cache/lollms:/cache \
-p 8080:8080 --name lollms lollms-webui:0.0.1
The option -e CPU_THREADS=4 can be used to limit the number of CPU threads used by the LLMs; otherwise, all available threads are used.
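For example, to limit the container to four threads (the thread count is just an illustration):
docker run --rm -it --gpus all -v ~/.cache/lollms:/cache \
  -e CPU_THREADS=4 -p 8080:8080 --name lollms lollms-webui:0.0.1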
The option --entrypoint bash can be used to start a shell instead of the web interface.
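For example, to open an interactive shell in the container for inspection or debugging:
docker run --rm -it --gpus all -v ~/.cache/lollms:/cache \
  --entrypoint bash --name lollms lollms-webui:0.0.1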
The web interface will be available at http://localhost:8080.
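To quickly check from the host that the server is responding, you can, for example, send a request with curl:
curl -I http://localhost:8080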