musa: add docker image support (#9685)
* mtgpu: add docker image support Signed-off-by: Xiaodong Ye <xiaodong.ye@mthreads.com> * mtgpu: enable docker workflow Signed-off-by: Xiaodong Ye <xiaodong.ye@mthreads.com> --------- Signed-off-by: Xiaodong Ye <xiaodong.ye@mthreads.com>
This commit is contained in:
		
							parent
							
								
									c7499c557c
								
							
						
					
					
						commit
						cf8e0a3bb9
					
				
					 6 changed files with 134 additions and 3 deletions
				
			
		
							
								
								
									
										26
									
								
								.devops/full-musa.Dockerfile
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										26
									
								
								.devops/full-musa.Dockerfile
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,26 @@ | |||
| ARG UBUNTU_VERSION=22.04 | ||||
| # This needs to generally match the container host's environment. | ||||
| ARG MUSA_VERSION=rc3.1.0 | ||||
| # Target the MUSA build image | ||||
| ARG BASE_MUSA_DEV_CONTAINER=mthreads/musa:${MUSA_VERSION}-devel-ubuntu${UBUNTU_VERSION} | ||||
| 
 | ||||
| FROM ${BASE_MUSA_DEV_CONTAINER} AS build | ||||
| 
 | ||||
| RUN apt-get update && \ | ||||
|     apt-get install -y build-essential cmake python3 python3-pip git libcurl4-openssl-dev libgomp1 | ||||
| 
 | ||||
| COPY requirements.txt   requirements.txt | ||||
| COPY requirements       requirements | ||||
| 
 | ||||
| RUN pip install --upgrade pip setuptools wheel \ | ||||
|     && pip install -r requirements.txt | ||||
| 
 | ||||
| WORKDIR /app | ||||
| 
 | ||||
| COPY . . | ||||
| 
 | ||||
| RUN cmake -B build -DGGML_MUSA=ON -DLLAMA_CURL=ON ${CMAKE_ARGS} -DCMAKE_EXE_LINKER_FLAGS=-Wl,--allow-shlib-undefined . && \ | ||||
|     cmake --build build --config Release -j$(nproc) && \ | ||||
|     cp build/bin/* . | ||||
| 
 | ||||
| ENTRYPOINT ["/app/.devops/tools.sh"] | ||||
							
								
								
									
										30
									
								
								.devops/llama-cli-musa.Dockerfile
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										30
									
								
								.devops/llama-cli-musa.Dockerfile
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,30 @@ | |||
| ARG UBUNTU_VERSION=22.04 | ||||
| # This needs to generally match the container host's environment. | ||||
| ARG MUSA_VERSION=rc3.1.0 | ||||
| # Target the MUSA build image | ||||
| ARG BASE_MUSA_DEV_CONTAINER=mthreads/musa:${MUSA_VERSION}-devel-ubuntu${UBUNTU_VERSION} | ||||
| # Target the MUSA runtime image | ||||
| ARG BASE_MUSA_RUN_CONTAINER=mthreads/musa:${MUSA_VERSION}-runtime-ubuntu${UBUNTU_VERSION} | ||||
| 
 | ||||
| FROM ${BASE_MUSA_DEV_CONTAINER} AS build | ||||
| 
 | ||||
| RUN apt-get update && \ | ||||
|     apt-get install -y build-essential git cmake | ||||
| 
 | ||||
| WORKDIR /app | ||||
| 
 | ||||
| COPY . . | ||||
| 
 | ||||
| RUN cmake -B build -DGGML_MUSA=ON ${CMAKE_ARGS} -DCMAKE_EXE_LINKER_FLAGS=-Wl,--allow-shlib-undefined . && \ | ||||
|     cmake --build build --config Release --target llama-cli -j$(nproc) | ||||
| 
 | ||||
| FROM ${BASE_MUSA_RUN_CONTAINER} AS runtime | ||||
| 
 | ||||
| RUN apt-get update && \ | ||||
|     apt-get install -y libgomp1 | ||||
| 
 | ||||
| COPY --from=build /app/build/ggml/src/libggml.so /libggml.so | ||||
| COPY --from=build /app/build/src/libllama.so /libllama.so | ||||
| COPY --from=build /app/build/bin/llama-cli /llama-cli | ||||
| 
 | ||||
| ENTRYPOINT [ "/llama-cli" ] | ||||
							
								
								
									
										35
									
								
								.devops/llama-server-musa.Dockerfile
									
										
									
									
									
										Normal file
									
								
							
							
						
						
									
										35
									
								
								.devops/llama-server-musa.Dockerfile
									
										
									
									
									
										Normal file
									
								
							|  | @ -0,0 +1,35 @@ | |||
| ARG UBUNTU_VERSION=22.04 | ||||
| # This needs to generally match the container host's environment. | ||||
| ARG MUSA_VERSION=rc3.1.0 | ||||
| # Target the MUSA build image | ||||
| ARG BASE_MUSA_DEV_CONTAINER=mthreads/musa:${MUSA_VERSION}-devel-ubuntu${UBUNTU_VERSION} | ||||
| # Target the MUSA runtime image | ||||
| ARG BASE_MUSA_RUN_CONTAINER=mthreads/musa:${MUSA_VERSION}-runtime-ubuntu${UBUNTU_VERSION} | ||||
| 
 | ||||
| FROM ${BASE_MUSA_DEV_CONTAINER} AS build | ||||
| 
 | ||||
| RUN apt-get update && \ | ||||
|     apt-get install -y build-essential git cmake libcurl4-openssl-dev | ||||
| 
 | ||||
| WORKDIR /app | ||||
| 
 | ||||
| COPY . . | ||||
| 
 | ||||
| RUN cmake -B build -DGGML_MUSA=ON -DLLAMA_CURL=ON ${CMAKE_ARGS} -DCMAKE_EXE_LINKER_FLAGS=-Wl,--allow-shlib-undefined . && \ | ||||
|     cmake --build build --config Release --target llama-server -j$(nproc) | ||||
| 
 | ||||
| FROM ${BASE_MUSA_RUN_CONTAINER} AS runtime | ||||
| 
 | ||||
| RUN apt-get update && \ | ||||
|     apt-get install -y libcurl4-openssl-dev libgomp1 curl | ||||
| 
 | ||||
| COPY --from=build /app/build/ggml/src/libggml.so /libggml.so | ||||
| COPY --from=build /app/build/src/libllama.so /libllama.so | ||||
| COPY --from=build /app/build/bin/llama-server /llama-server | ||||
| 
 | ||||
| # Must be set to 0.0.0.0 so it can listen to requests from host machine | ||||
| ENV LLAMA_ARG_HOST=0.0.0.0 | ||||
| 
 | ||||
| HEALTHCHECK CMD [ "curl", "-f", "http://localhost:8080/health" ] | ||||
| 
 | ||||
| ENTRYPOINT [ "/llama-server" ] | ||||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue