Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
24 changes: 0 additions & 24 deletions Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -253,24 +253,6 @@ COPY server/custom_kernels/ /usr/src/.
RUN cd /usr/src && python setup.py build_ext && python setup.py install


## Build transformers exllama kernels ##########################################
FROM python-builder as exllama-kernels-builder

WORKDIR /usr/src

COPY server/exllama_kernels/ .
RUN python setup.py build


## Build transformers exllamav2 kernels ########################################
FROM python-builder as exllamav2-kernels-builder

WORKDIR /usr/src

COPY server/exllamav2_kernels/ .
RUN python setup.py build


## Flash attention v2 cached build image #######################################
FROM base as flash-att-v2-cache

Expand Down Expand Up @@ -301,12 +283,6 @@ ENV PATH=/opt/tgis/bin:$PATH
RUN --mount=type=bind,from=flash-att-v2-cache,src=/usr/src/flash-attention-v2,target=/usr/src/flash-attention-v2 \
pip install /usr/src/flash-attention-v2/*.whl --no-cache-dir

# Copy build artifacts from exllama kernels builder
COPY --from=exllama-kernels-builder /usr/src/build/lib.linux-x86_64-cpython-* ${SITE_PACKAGES}

# Copy build artifacts from exllamav2 kernels builder
COPY --from=exllamav2-kernels-builder /usr/src/build/lib.linux-x86_64-cpython-* ${SITE_PACKAGES}

# Copy over the auto-gptq wheel and install it
RUN --mount=type=bind,from=auto-gptq-cache,src=/usr/src/auto-gptq-wheel,target=/usr/src/auto-gptq-wheel \
pip install /usr/src/auto-gptq-wheel/*.whl --no-cache-dir
Expand Down
71 changes: 0 additions & 71 deletions server/exllama_kernels/exllama_kernels/cuda_buffers.cu

This file was deleted.

52 changes: 0 additions & 52 deletions server/exllama_kernels/exllama_kernels/cuda_buffers.cuh

This file was deleted.

58 changes: 0 additions & 58 deletions server/exllama_kernels/exllama_kernels/cuda_compat.cuh

This file was deleted.

61 changes: 0 additions & 61 deletions server/exllama_kernels/exllama_kernels/cuda_func/column_remap.cu

This file was deleted.

19 changes: 0 additions & 19 deletions server/exllama_kernels/exllama_kernels/cuda_func/column_remap.cuh

This file was deleted.

Loading