Spaces:
				
			
			
	
			
			
		Paused
		
	
	
	
			
			
	
	
	
	
		
		
		Paused
		
# The -devel image is needed because bitsandbytes requires libcudart.so; otherwise the -runtime image would be sufficient.
FROM nvidia/cuda:11.8.0-cudnn8-devel-ubuntu20.04

# Build-time only: RUN steps still see DEBIAN_FRONTEND=noninteractive, but the
# setting is no longer baked into the environment of running containers.
ARG DEBIAN_FRONTEND=noninteractive

# Put /h2ogpt_conda/bin first on PATH for build steps and at runtime
# (presumably where the build script installs the Python toolchain -- confirm
# against docker_build_script_ubuntu.sh).
ENV PATH="/h2ogpt_conda/bin:${PATH}"
# NOTE(review): this ARG reuses the name of the ENV above and carries the same
# prefix; kept as in the original because its effect is builder-dependent.
# Confirm whether it is still required before removing it.
ARG PATH="/h2ogpt_conda/bin:${PATH}"

ENV HOME=/workspace \
    CUDA_HOME=/usr/local/cuda-11.8 \
    VLLM_CACHE=/workspace/.vllm_cache

WORKDIR /workspace
COPY . /workspace/

# WORKDIR is already /workspace, so the build script is invoked directly
# without an extra `cd`.
RUN chmod +x /workspace/docker_build_script_ubuntu.sh && ./docker_build_script_ubuntu.sh

# NOTE(review): makes the whole workspace readable, writable and executable by
# every user. Kept as-is because the runtime may depend on it; tighten to
# targeted ownership/permissions if that turns out not to be the case.
RUN chmod -R a+rwx /workspace

# Account the container runs as; each value can be overridden with --build-arg.
ARG user=h2ogpt
ARG group=h2ogpt
ARG uid=1000
ARG gid=1000
RUN groupadd -g "${gid}" "${group}" && useradd -u "${uid}" -g "${group}" -s /bin/bash "${user}"

EXPOSE 8888
EXPOSE 7860
EXPOSE 5000

# Follow the `user` build argument so that overriding it does not leave USER
# pointing at an account that was never created.
USER ${user}

# ENTRYPOINT ["python3.10"]
# Default command: run generate.py with --load_8bit True against the
# h2oai/h2ogpt-4096-llama2-7b-chat base model.
CMD ["python3.10", "generate.py", "--load_8bit", "True", "--base_model", "h2oai/h2ogpt-4096-llama2-7b-chat"]