- Corrected the misspelling of WMMA (previously misspelt as "WAAM")
- Included rocm-7rc-rocwmma toolbox
- Included updated benchmark results, including ROCm 7rc with rocWMMA and hipBLASLt
This commit is contained in:
@@ -34,12 +34,5 @@ RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \
|
||||
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
|
||||
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
|
||||
|
||||
# Ensure we are using hipblaslt
|
||||
RUN printf '%s\n' \
|
||||
'export ROCBLAS_USE_HIPBLASLT=1' \
|
||||
> /etc/profile.d/rocm.sh \
|
||||
&& chmod +x /etc/profile.d/rocm.sh \
|
||||
&& echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc
|
||||
|
||||
# Default to interactive shell
|
||||
CMD ["/bin/bash"]
|
||||
|
||||
@@ -41,12 +41,5 @@ RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \
|
||||
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
|
||||
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
|
||||
|
||||
# Ensure we are using hipblaslt
|
||||
RUN printf '%s\n' \
|
||||
'export ROCBLAS_USE_HIPBLASLT=1' \
|
||||
> /etc/profile.d/rocm.sh \
|
||||
&& chmod +x /etc/profile.d/rocm.sh \
|
||||
&& echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc
|
||||
|
||||
# Default to interactive shell
|
||||
CMD ["/bin/bash"]
|
||||
@@ -48,11 +48,11 @@ RUN printf '%s\n' \
|
||||
&& chmod +x /etc/profile.d/rocm.sh \
|
||||
&& echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc
|
||||
|
||||
# Install ROCWAAM
|
||||
# Install rocwmma
|
||||
WORKDIR /opt/
|
||||
COPY ./build-rocwaam.sh .
|
||||
RUN chmod +x build-rocwaam.sh
|
||||
RUN ./build-rocwaam.sh
|
||||
COPY ./build-rocwmma.sh .
|
||||
RUN chmod +x build-rocwmma.sh
|
||||
RUN ./build-rocwmma.sh
|
||||
|
||||
# 6) Clone llama.cpp
|
||||
WORKDIR /opt/llama.cpp
|
||||
@@ -60,7 +60,7 @@ RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . \
|
||||
&& git clean -xdf \
|
||||
&& git submodule update --recursive
|
||||
|
||||
# Apply PAtch for ROCWAAM
|
||||
# Apply PAtch for rocwmma
|
||||
COPY ./apply-rocwmma-fix.sh /opt
|
||||
RUN chmod +x /opt/apply-rocwmma-fix.sh
|
||||
RUN /opt/apply-rocwmma-fix.sh /opt/llama.cpp
|
||||
@@ -2,6 +2,7 @@
|
||||
|
||||
# apply-rocwmma-fix.sh - Apply rocWMMA compatibility fixes to llama.cpp
|
||||
# Usage: ./apply-rocwmma-fix.sh <path-to-llama.cpp-directory>
|
||||
# Source: https://github.com/lhl/strix-halo-testing/blob/main/llm-bench/apply-rocwmma-fix.sh
|
||||
|
||||
set -euo pipefail
|
||||
|
||||
|
||||
@@ -1,3 +1,4 @@
|
||||
# Source: https://github.com/lhl/strix-halo-testing/blob/main/llm-bench/build-rocwmma.sh
|
||||
git clone https://github.com/ROCm/rocWMMA
|
||||
cd rocWMMA
|
||||
|
||||
|
||||
Reference in New Issue
Block a user