From f4217a81fc181e43e42d3c019df97906be31663b Mon Sep 17 00:00:00 2001
From: Aleksei Nikiforov <aleksei.nikiforov@linux.ibm.com>
Date: Tue, 21 Jan 2025 12:15:34 +0100
Subject: [PATCH] Disable mmap on s390x in llama-quant too

---
 src/llama-quant.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/llama-quant.cpp b/src/llama-quant.cpp
index fb7982655..c91af4cbd 100644
--- a/src/llama-quant.cpp
+++ b/src/llama-quant.cpp
@@ -514,7 +514,7 @@ static void llama_model_quantize_impl(const std::string & fname_inp, const std::
 
     // mmap consistently increases speed Linux, and also increases speed on Windows with
     // hot cache. It may cause a slowdown on macOS, possibly related to free memory.
-#if defined(__linux__) || defined(_WIN32)
+#if (defined(__linux__) && !defined(__s390x__)) || defined(_WIN32)
     constexpr bool use_mmap = true;
 #else
     constexpr bool use_mmap = false;