Skip to content

Commit c8995a2

Browse files
author
Joan Martinez
committed
fix: merge issues
2 parents a8a64fd + f5d7b26 commit c8995a2

File tree

124 files changed

+1806
-1780
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

124 files changed

+1806
-1780
lines changed

.devops/full-cuda.Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@ FROM ${BASE_CUDA_DEV_CONTAINER} as build
1212
ARG CUDA_DOCKER_ARCH=all
1313

1414
RUN apt-get update && \
15-
apt-get install -y build-essential python3 python3-pip git libcurl4-openssl-dev
15+
apt-get install -y build-essential python3 python3-pip git libcurl4-openssl-dev libgomp1
1616

1717
COPY requirements.txt requirements.txt
1818
COPY requirements requirements

.devops/full.Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@ ARG UBUNTU_VERSION=22.04
33
FROM ubuntu:$UBUNTU_VERSION as build
44

55
RUN apt-get update && \
6-
apt-get install -y build-essential python3 python3-pip git libcurl4-openssl-dev
6+
apt-get install -y build-essential python3 python3-pip git libcurl4-openssl-dev libgomp1
77

88
COPY requirements.txt requirements.txt
99
COPY requirements requirements

.devops/main-cuda.Dockerfile

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -23,10 +23,13 @@ ENV CUDA_DOCKER_ARCH=${CUDA_DOCKER_ARCH}
2323
# Enable CUDA
2424
ENV LLAMA_CUDA=1
2525

26-
RUN make -j$(nproc)
26+
RUN make -j$(nproc) main
2727

2828
FROM ${BASE_CUDA_RUN_CONTAINER} as runtime
2929

30+
RUN apt-get update && \
31+
apt-get install -y libgomp1
32+
3033
COPY --from=build /app/main /main
3134

3235
ENTRYPOINT [ "/main" ]

.devops/main-rocm.Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -40,6 +40,6 @@ ENV LLAMA_HIPBLAS=1
4040
ENV CC=/opt/rocm/llvm/bin/clang
4141
ENV CXX=/opt/rocm/llvm/bin/clang++
4242

43-
RUN make -j$(nproc)
43+
RUN make -j$(nproc) main
4444

4545
ENTRYPOINT [ "/app/main" ]

.devops/main-vulkan.Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@ ARG UBUNTU_VERSION=jammy
33
FROM ubuntu:$UBUNTU_VERSION as build
44

55
# Install build tools
6-
RUN apt update && apt install -y git build-essential cmake wget
6+
RUN apt update && apt install -y git build-essential cmake wget libgomp1
77

88
# Install Vulkan SDK
99
RUN wget -qO - https://packages.lunarg.com/lunarg-signing-key-pub.asc | apt-key add - && \

.devops/main.Dockerfile

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -9,10 +9,13 @@ WORKDIR /app
99

1010
COPY . .
1111

12-
RUN make -j$(nproc)
12+
RUN make -j$(nproc) main
1313

1414
FROM ubuntu:$UBUNTU_VERSION as runtime
1515

16+
RUN apt-get update && \
17+
apt-get install -y libgomp1
18+
1619
COPY --from=build /app/main /main
1720

1821
ENV LC_ALL=C.utf8

.devops/server-cuda.Dockerfile

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -25,12 +25,12 @@ ENV LLAMA_CUDA=1
2525
# Enable cURL
2626
ENV LLAMA_CURL=1
2727

28-
RUN make -j$(nproc)
28+
RUN make -j$(nproc) server
2929

3030
FROM ${BASE_CUDA_RUN_CONTAINER} as runtime
3131

3232
RUN apt-get update && \
33-
apt-get install -y libcurl4-openssl-dev
33+
apt-get install -y libcurl4-openssl-dev libgomp1
3434

3535
COPY --from=build /app/server /server
3636

.devops/server.Dockerfile

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -11,12 +11,12 @@ COPY . .
1111

1212
ENV LLAMA_CURL=1
1313

14-
RUN make -j$(nproc)
14+
RUN make -j$(nproc) server
1515

1616
FROM ubuntu:$UBUNTU_VERSION as runtime
1717

1818
RUN apt-get update && \
19-
apt-get install -y libcurl4-openssl-dev
19+
apt-get install -y libcurl4-openssl-dev libgomp1
2020

2121
COPY --from=build /app/server /server
2222

CMakeLists.txt

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -416,6 +416,8 @@ if (LLAMA_CUDA)
416416
list(APPEND GGML_SOURCES_CUDA "ggml-cuda.cu")
417417
file(GLOB SRCS "ggml-cuda/template-instances/fattn-wmma*.cu")
418418
list(APPEND GGML_SOURCES_CUDA ${SRCS})
419+
file(GLOB SRCS "ggml-cuda/template-instances/mmq*.cu")
420+
list(APPEND GGML_SOURCES_CUDA ${SRCS})
419421

420422
add_compile_definitions(GGML_USE_CUDA)
421423
add_compile_definitions(GGML_CUDA_USE_GRAPHS)
@@ -588,6 +590,8 @@ if (LLAMA_HIPBLAS)
588590
list(APPEND GGML_SOURCES_ROCM "ggml-cuda.cu")
589591
file(GLOB SRCS "ggml-cuda/template-instances/fattn-wmma*.cu")
590592
list(APPEND GGML_SOURCES_ROCM ${SRCS})
593+
file(GLOB SRCS "ggml-cuda/template-instances/mmq*.cu")
594+
list(APPEND GGML_SOURCES_ROCM ${SRCS})
591595

592596
add_compile_definitions(GGML_USE_HIPBLAS GGML_USE_CUDA)
593597

Makefile

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -444,6 +444,7 @@ ifdef LLAMA_CUBLAS
444444
endif
445445

446446
OBJS_CUDA_TEMP_INST = $(patsubst %.cu,%.o,$(wildcard ggml-cuda/template-instances/fattn-wmma*.cu))
447+
OBJS_CUDA_TEMP_INST += $(patsubst %.cu,%.o,$(wildcard ggml-cuda/template-instances/mmq*.cu))
447448
ifdef LLAMA_CUDA_FA_ALL_QUANTS
448449
OBJS_CUDA_TEMP_INST += $(patsubst %.cu,%.o,$(wildcard ggml-cuda/template-instances/fattn-vec*.cu))
449450
else

0 commit comments

Comments
 (0)