diff --git a/examples/server/server.cpp b/examples/server/server.cpp
index 10c076262..c52962b5e 100644
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -608,7 +608,7 @@ struct llama_server_context
         default_generation_settings_for_props = get_formatted_generation(slots.front());
         default_generation_settings_for_props["seed"] = -1;
 
-        batch = llama_batch_init(n_ctx_slot, 0, params.n_parallel);     // this works fine with the slot context and saves VRAM
+        batch = llama_batch_init(n_ctx, 0, params.n_parallel);     // this works fine with the slot context and saves VRAM
     }
 
     std::vector<llama_token> tokenize(const json & json_prompt, bool add_bos) const
@@ -1563,7 +1563,7 @@ struct llama_server_context
                 if (slot == nullptr)
                 {
                     // if no slot is available, we defer this task for processing later
-                    LOG_VERBOSE("no slot is available", {{"task_id", task.id}});
+                    LOG_VERBOSE("no slot is available", {"task_id", task.id});
                     queue_tasks.defer(task);
                     break;
                 } else {
@@ -3222,24 +3222,13 @@ int main(int argc, char **argv)
             return true;
         }
 
-        // Check for API key in the header
+        // Check for API key in the header (TODO: need to add username eventually but ...)
         auto auth_header = req.get_header_value("Authorization");
         std::string prefix = "Bearer ";
         if (auth_header.substr(0, prefix.size()) == prefix) {
             std::string received_api_key = auth_header.substr(prefix.size());
             LOG("Received API key = %s\n", received_api_key.c_str());
-            /*
-            for (int i = 0; i < int(sparams.api_keys.size()); i++) {
-                // for some reason the file apikeys are one character longer than those passed from Bearer so we shorten them
-                std::string uncut_api = sparams.api_keys[i]; // store original apikey
-                std::string cut_api = uncut_api.substr(0, uncut_api.size() - 1);    // do not shorten in-place by using erase
-                if (received_api_key != cut_api) {
-                    LOG("%s != %s and length left = %zu, length right = %zu\n", received_api_key.c_str(), cut_api.c_str(),received_api_key.size(), cut_api.size());
-                } else if (received_api_key == cut_api) {
-                    LOG("%s = %s Found matching api key.\n", received_api_key.c_str(), cut_api.c_str());
-                    return true;
-                }
-                */
+
             for (auto& item : sparams.api_keys) {
                 std::string username = item.first;
                 std::string apikey = item.second[0];
@@ -3250,9 +3239,6 @@ int main(int argc, char **argv)
                     }
                 }
             }
-            //if (std::find(sparams.api_keys.begin(), sparams.api_keys.end(), received_api_key) != sparams.api_keys.end()) {
-            //    return true; // API key is valid
-            //}
 
         // API key is invalid or not provided
         res.set_content("Unauthorized: Invalid API Key", "text/plain; charset=utf-8");
diff --git a/examples/server/utils.hpp b/examples/server/utils.hpp
index d8f03766e..a53effd20 100644
--- a/examples/server/utils.hpp
+++ b/examples/server/utils.hpp
@@ -16,21 +16,23 @@ using json = nlohmann::json;
 extern bool server_verbose;
 extern bool server_log_json;
 
-#ifndef SERVER_VERBOSE
+#ifndef SERVER_VERBOSE          // if not defined externally above, make it true and enable verbose logging
 #define SERVER_VERBOSE 1
 #endif
 
 #if SERVER_VERBOSE != 1
-#define LOG_VERBOSE(MSG, ...)
+#define LOG_VERBOSE(MSG, ...)   // if not verbose logging just return empty
 #else
 #define LOG_VERBOSE(MSG, ...)                                            \
     do                                                                   \
     {                                                                    \
         if (server_verbose)                                              \
         {                                                                \
-            server_log("VERB", __func__, __LINE__, MSG, __VA_ARGS__); \
+            server_log("VERB", __func__, __LINE__, MSG, __VA_ARGS__,     \
+               log_settings.stdout_target, log_settings.stdout_reset,    \
+               log_settings.stderr_target, log_settings.stderr_reset);   \
         }                                                                \
-    } while (0)
+    } while (0)     // this is always false so the loop only compiles once but is treated as a single statement
 #endif
 
 // ATTEMPT TO REFACTOR THE LOGGING BEHAVIOUR AND ALLOW REDIRECTION OF STDOUT, STDERR
@@ -38,9 +40,9 @@ extern bool server_log_json;
 struct LogRedirection {
   // Set default values for redirection targets and reset strings
   std::string stdout_target = "stdout_log.log";
-  std::string stdout_reset = "dev/tty";
+  std::string stdout_reset = "stdout";
   std::string stderr_target = "stderr_log.log";
-  std::string stderr_reset = "dev/tty";
+  std::string stderr_reset = "stderr";
 };
 
 LogRedirection log_settings;
@@ -61,14 +63,14 @@ LogRedirection log_settings;
                log_settings.stderr_target, log_settings.stderr_reset)
 
 /*
-// Example usage:
-LogRedirection default_settings;  // Use defaults
+// Example usage (WIP):
+LogRedirection default_settings;  // Use defaults but not necessary to say so
 LogRedirection custom_settings;
 
 // Modify values for custom settings if needed
-custom_settings.stdout_target = "/tmp/custom.log";
+log_settings.stdout_target = "/tmp/custom.log";
 
-LOG_ERROR("Default error", "Details", default_settings);
+LOG_ERROR("Default error", "Details", default_settings);    // can omit default_settings because it will default to log_settings unmodified
 LOG_ERROR("Custom error", "More info", custom_settings);
 
 
@@ -197,13 +199,12 @@ static inline void server_log(
     int line,
     const char *message,
     const nlohmann::ordered_json &extra,
-    // specify targets and resets for stdout and stderr;
+    // targets and resets for stdout and stderr are specified in LogRedirection above;
     // this allows different behaviour for LOG_ERROR, LOG_WARNING and LOG_INFO
-                 // destination for stdout redirection e.g. a file or "dev/null"
-    std::string stdout_target = "dev/stdout",
-    std::string stderr_target = "dev/tty",                // destination for stderr redirection
-    std::string stdout_reset = "dev/stderr",              // reset for stdout e.g. "dev/tty"
-    std::string stderr_reset = "dev/tty"
+    std::string stdout_target,
+    std::string stderr_target,
+    std::string stdout_reset,
+    std::string stderr_reset
 )
 {
     std::stringstream ss_tid;
@@ -214,7 +215,7 @@ static inline void server_log(
     };
 
     freopen(stdout_target.c_str(), "a", stdout);
-    freopen(stderr_target.c_str(), "w", stderr);      // we assign stderr to dev/null effectively 'blackholing' the output because log.dump below is redirected too
+    freopen(stderr_target.c_str(), "a", stderr);      // we assign stderr to dev/null effectively 'blackholing' the output because log.dump below is redirected too
 
     if (server_log_json) {
         log.merge_patch(
@@ -227,7 +228,7 @@ static inline void server_log(
         if (!extra.empty()) {
             log.merge_patch(extra);
         }
-        std::cerr << log.dump(-1, ' ', false, json::error_handler_t::replace) << "\n" << std::flush;    // was originally std:cout
+        std::cout << log.dump(-1, ' ', false, json::error_handler_t::replace) << "\n" << std::flush;    // was originally std:cout
 
     } else {                // store the logs in (because not json) text format
         char buf[1024];
@@ -276,8 +277,7 @@ inline bool verify_custom_template(const std::string & tmpl) {
 }
 
 // Format given chat. If tmpl is empty, we take the template from model metadata
-inline std::string format_chat(const struct llama_model * model, const std::string & tmpl, const std::vector<json> & messages)
-{
+inline std::string format_chat(const struct llama_model * model, const std::string & tmpl, const std::vector<json> & messages) {
     size_t alloc_size = 0;
     // vector holding all allocated string to be passed to llama_chat_apply_template
     std::vector<std::string> str(messages.size() * 2);
@@ -305,7 +305,7 @@ inline std::string format_chat(const struct llama_model * model, const std::stri
     }
 
     std::string formatted_chat(buf.data(), res);
-    LOG_VERBOSE("formatted_chat", {{"text", formatted_chat.c_str()}});
+    LOG_VERBOSE("formatted_chat", {"text", formatted_chat.c_str()});
 
     return formatted_chat;
 }
@@ -333,7 +333,7 @@ struct llama_server_queue {
         std::unique_lock<std::mutex> lock(mutex_tasks);
         if (task.id == -1) {
             task.id = id++;
-            LOG_VERBOSE("new task id", {{"new_id", task.id}});
+            LOG_VERBOSE("new task id", {"new_id", task.id});
         }
         queue_tasks.push_back(std::move(task));
         //LOG("Queue now has %2zu members.\n", queue_tasks.size());
@@ -352,7 +352,7 @@ struct llama_server_queue {
     int get_new_id() {
         std::unique_lock<std::mutex> lock(mutex_tasks);
         int new_id = id++;
-        LOG_VERBOSE("new task id", {{"new_id", new_id}});
+        LOG_VERBOSE("new task id", {"new_id", new_id});
         return new_id;
     }
 
@@ -410,7 +410,7 @@ struct llama_server_queue {
                     task_server task = queue_tasks.front();
                     queue_tasks.erase(queue_tasks.begin());
                     lock.unlock();
-                    LOG_VERBOSE("callback_new_task", {{"task_id", task.id}});
+                    LOG_VERBOSE("callback_new_task", {"task_id", task.id});
                     callback_new_task(task);
                 }
                 // process and update all the multitasks
@@ -490,14 +490,14 @@ struct llama_server_response {
     std::condition_variable condition_results;
 
     void add_waiting_task_id(int task_id) {
-        LOG_VERBOSE("waiting for task id", {{"task_id", task_id}});
+        LOG_VERBOSE("waiting for task id", {"task_id", task_id});
         std::unique_lock<std::mutex> lock(mutex_results);
         waiting_task_ids.insert(task_id);
         LOG("Waiting task list size after addition: %2zu.\n", waiting_task_ids.size());
     }
 
     void remove_waiting_task_id(int task_id) {
-        LOG_VERBOSE("remove waiting for task id", {{"task_id", task_id}});
+        LOG_VERBOSE("remove waiting for task id", {"task_id", task_id});
         std::unique_lock<std::mutex> lock(mutex_results);
         waiting_task_ids.erase(task_id);
         LOG("Waiting task list size after removal: %zu.\n", waiting_task_ids.size());
@@ -535,20 +535,20 @@ struct llama_server_response {
     // Send a new result to a waiting task_id
     void send(task_result result) {
         std::unique_lock<std::mutex> lock(mutex_results);
-        LOG_VERBOSE("send new result", {{"task_id", result.id}});
+        LOG_VERBOSE("send new result", {"task_id", result.id});
         for (auto& task_id : waiting_task_ids) {
             // LOG("waiting task id %i \n", task_id);
             // for now, tasks that have associated parent multitasks just get erased once multitask picks up the result
             if (result.multitask_id == task_id)
             {
-                LOG_VERBOSE("callback_update_multitask", {{"task_id", task_id}});
+                LOG_VERBOSE("callback_update_multitask", {"task_id", task_id});
                 callback_update_multitask(task_id, result.id, result);
                 continue;
             }
 
             if (result.id == task_id)
             {
-                LOG_VERBOSE("queue_results.push_back", {{"task_id", task_id}});
+                LOG_VERBOSE("queue_results.push_back", {"task_id", task_id});
                 queue_results.push_back(result);
                 condition_results.notify_all();
                 return;