You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
14 lines
565 B
Docker
14 lines
565 B
Docker
# Image with TensorRT-LLM, ModelScope and the Python requirements of the
# TensorRT-LLM Qwen example, built on the CUDA 12.1 development base image.
FROM nvidia/cuda:12.1.0-devel-ubuntu22.04

# OS-level dependencies: Python 3.10 + pip, the OpenMPI runtime and headers,
# and git (used below to fetch the TensorRT-LLM sources).
# - update and install share one layer so the package index is never stale.
# - DEBIAN_FRONTEND is set inline (not via ENV) so package configuration
#   cannot block the build on a prompt and the setting does not leak into
#   the runtime environment.
# - The apt lists are removed in the same layer to keep the image smaller.
# NOTE(review): recommended packages are intentionally still installed;
# python3-pip's recommends presumably supply build tooling needed by
# source-built Python packages -- confirm before adding
# --no-install-recommends.
RUN apt-get update && \
    DEBIAN_FRONTEND=noninteractive apt-get -y install \
        git \
        libopenmpi-dev \
        openmpi-bin \
        python3-pip \
        python3.10 && \
    rm -rf /var/lib/apt/lists/*

# Pinned TensorRT-LLM development build. --pre allows the pre-release version
# to be selected and the extra index adds NVIDIA's package index as a source.
RUN pip install tensorrt_llm==0.8.0.dev2024011601 -U --no-cache-dir --pre --extra-index-url https://pypi.nvidia.com

# Pinned ModelScope release.
RUN pip install --no-cache-dir modelscope==1.11.1

# Fetch the TensorRT-LLM sources at a fixed commit and install the Python
# requirements of the Qwen example from that checkout.
# `cd` is used inside the RUN (instead of WORKDIR) so the image's working
# directory stays exactly as it was before this step.
RUN git clone https://github.com/NVIDIA/TensorRT-LLM.git && \
    cd TensorRT-LLM && \
    git checkout c89653021e66ca78c55f02b366f404455bc12e8d && \
    pip install --no-cache-dir -r examples/qwen/requirements.txt