From 7d6511b62a19ba2c737035cff9617c09a763464c Mon Sep 17 00:00:00 2001 From: Ariel Nunez <54999+ingenieroariel@users.noreply.github.com> Date: Thu, 11 May 2023 07:13:52 -0400 Subject: [PATCH] Added model download links. https://huggingface.co/ceonlabs/radpajama/tree/main --- third_party/radpajama/radpajama.cc | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/third_party/radpajama/radpajama.cc b/third_party/radpajama/radpajama.cc index 77db3c3fc..ab2c27dcf 100644 --- a/third_party/radpajama/radpajama.cc +++ b/third_party/radpajama/radpajama.cc @@ -2997,7 +2997,13 @@ static int on_missing_feature(const char *name) { int main(int argc, char ** argv) { gpt_params params; - params.model = "ggml-RedPajama-INCITE-Chat-3B-v1-q8_0.bin"; + // Models can be freely downloaded from: + // https://huggingface.co/ceonlabs/radpajama/tree/main + // Preferred one in float16 format, this can be used to generate the quantized one. + // ggml-RedPajama-INCITE-Chat-3B-v1-f16.bin 5.55GB + // Quantized for faster inference, 8bit integers. + // ggml-RedPajama-INCITE-Chat-3B-v1-q8_0.bin 3.13 GB + params.model = "ggml-RedPajama-INCITE-Chat-3B-v1-f16.bin"; if (gpt_params_parse(argc, argv, params) == false) { return 1;