Recognize q8_0 as an older format, as the new CLBlast doesn't work correctly with it
This commit is contained in:
parent
49d6334dc1
commit
8a5fe628df
2 changed files with 13 additions and 5 deletions
|
@ -248,7 +248,7 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in
|
|||
}
|
||||
if (file_format < FileFormat::GGJT_2)
|
||||
{
|
||||
printf("\n---\nWarning: Your model has an INVALID or OUTDATED format (ver %d). Please reconvert it for better results!\n---\n", file_format);
|
||||
printf("\n---\nWarning: Your model may be an OUTDATED format (ver %d). Please reconvert it for better results!\n---\n", file_format);
|
||||
}
|
||||
|
||||
if (lora_filename != "")
|
||||
|
|
|
@ -146,9 +146,17 @@ void print_tok_vec(std::vector<float> &embd)
|
|||
else if(magic == 0x67676a74) //v3 format ggjt
|
||||
{
|
||||
fileformat = FileFormat::GGJT_2; //ggjt by default
|
||||
uint32_t temp;
|
||||
fin.read((char *)&temp, sizeof(temp)); //file version
|
||||
if(temp==1)
|
||||
uint32_t ver, temp, ftype;
|
||||
fin.read((char *)&ver, sizeof(ver)); //file version
|
||||
fin.read((char *)&temp, sizeof(temp));//vocab
|
||||
fin.read((char *)&temp, sizeof(temp)); //embd
|
||||
fin.read((char *)&temp, sizeof(temp)); //mult
|
||||
fin.read((char *)&temp, sizeof(temp));//head
|
||||
fin.read((char *)&temp, sizeof(temp));//layer
|
||||
fin.read((char *)&temp, sizeof(temp));//rot
|
||||
fin.read((char *)&ftype, sizeof(ftype));//filetype
|
||||
|
||||
if(ver==1 || ftype==7) //q8 formats treat as old one
|
||||
{
|
||||
fileformat = FileFormat::GGJT;
|
||||
}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue