File tree Expand file tree Collapse file tree 5 files changed +10
-119
lines changed
applications/DeepSpeed-Chat Expand file tree Collapse file tree 5 files changed +10
-119
lines changed Original file line number Diff line number Diff line change @@ -41,13 +41,12 @@ RUN python -m pip install --upgrade pip setuptools wheel
4141
4242WORKDIR /workspace
4343
44- # Copy and install dependencies
45- COPY requirements.txt requirements_freeze.txt ./
46- RUN pip install -r requirements_freeze.txt
44+ # Install PyTorch first with CUDA 11.8 support
45+ RUN pip install torch==2.1.0 torchvision==0.16.0 torchaudio==2.1.0 --index-url https://download.pytorch.org/whl/cu118
4746
48- # Install additional packages that may be needed
49- # H100/H200 specific versions
50- RUN pip install --force-reinstall numpy==1.24.4 torch==2.5.0 pyarrow==18.0.0 tensorboard
47+ # Copy and install other dependencies
48+ COPY training/requirements_freeze.txt ./
49+ RUN pip install -r requirements_freeze.txt
5150
5251# Copy project code
5352COPY . .
Original file line number Diff line number Diff line change @@ -12,10 +12,10 @@ services:
1212 command: /bin/bash -c "/usr/sbin/sshd && tail -f /dev/null"
1313
1414 environment:
15- - PROJECT_PATH=${PROJECT_PATH}
16- - HF_HOME=${PROJECT_PATH}/.cache/huggingface
17- - TRANSFORMERS_CACHE=${PROJECT_PATH}/.cache/huggingface/transformers
18- - HF_DATASETS_CACHE=${PROJECT_PATH}/.cache/huggingface/datasets
15+ - PROJECT_PATH=${PROJECT_PATH:-/workspace}
16+ - HF_HOME=${PROJECT_PATH:-/workspace}/.cache/huggingface
17+ - TRANSFORMERS_CACHE=${PROJECT_PATH:-/workspace}/.cache/huggingface/transformers
18+ - HF_DATASETS_CACHE=${PROJECT_PATH:-/workspace}/.cache/huggingface/datasets
1919 - NVIDIA_VISIBLE_DEVICES=all
2020 - NVIDIA_DRIVER_CAPABILITIES=compute,utility
2121
Load Diff This file was deleted.
Original file line number Diff line number Diff line change @@ -30,7 +30,7 @@ mpmath==1.3.0
3030msgpack==1.1.2
3131multidict==6.7.0
3232multiprocess==0.70.15
33- networkx==3.5
33+ networkx==3.1
3434ninja==1.13.0
3535numpy==1.26.4
3636nvidia-cublas-cu12==12.8.4.1
@@ -75,9 +75,6 @@ sniffio==1.3.1
7575sympy==1.14.0
7676termcolor==3.1.0
7777tokenizers==0.20.1
78- torch==2.9.0+cu128
79- torchaudio==2.9.0+cu128
80- torchvision==0.24.0+cu128
8178tqdm==4.67.1
8279transformers==4.46.3
8380triton==3.5.0
Load Diff This file was deleted.
You can’t perform that action at this time.
0 commit comments