llama2c : use a destructor to prevent memory leaks
This commit is contained in:
parent
634d7272b8
commit
a04a6990eb
1 changed files with 18 additions and 19 deletions
|
@ -75,7 +75,7 @@ typedef struct {
|
||||||
int seq_len; // max sequence length
|
int seq_len; // max sequence length
|
||||||
} Config;
|
} Config;
|
||||||
|
|
||||||
typedef struct {
|
struct TransformerWeights {
|
||||||
// token embedding table
|
// token embedding table
|
||||||
float* token_embedding_table; // (vocab_size, dim)
|
float* token_embedding_table; // (vocab_size, dim)
|
||||||
// weights for rmsnorms
|
// weights for rmsnorms
|
||||||
|
@ -97,7 +97,22 @@ typedef struct {
|
||||||
// float* freq_cis_imag; // (seq_len, dim/2)
|
// float* freq_cis_imag; // (seq_len, dim/2)
|
||||||
// (optional) classifier weights for the logits, on the last layer
|
// (optional) classifier weights for the logits, on the last layer
|
||||||
float* wcls;
|
float* wcls;
|
||||||
} TransformerWeights;
|
|
||||||
|
~TransformerWeights() {
|
||||||
|
delete[] token_embedding_table;
|
||||||
|
delete[] rms_att_weight;
|
||||||
|
delete[] rms_ffn_weight;
|
||||||
|
delete[] wq;
|
||||||
|
delete[] wk;
|
||||||
|
delete[] wv;
|
||||||
|
delete[] wo;
|
||||||
|
delete[] w1;
|
||||||
|
delete[] w2;
|
||||||
|
delete[] w3;
|
||||||
|
delete[] rms_final_weight;
|
||||||
|
delete[] wcls;
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
void malloc_weights(TransformerWeights* w, Config* p, bool shared_weights) {
|
void malloc_weights(TransformerWeights* w, Config* p, bool shared_weights) {
|
||||||
// we calloc instead of malloc to keep valgrind happy
|
// we calloc instead of malloc to keep valgrind happy
|
||||||
|
@ -173,21 +188,6 @@ int checkpoint_init_weights(TransformerWeights *w, Config* p, FILE* f, bool shar
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
void free_weights(TransformerWeights* w) {
|
|
||||||
delete[] w->token_embedding_table;
|
|
||||||
delete[] w->rms_att_weight;
|
|
||||||
delete[] w->rms_ffn_weight;
|
|
||||||
delete[] w->wq;
|
|
||||||
delete[] w->wk;
|
|
||||||
delete[] w->wv;
|
|
||||||
delete[] w->wo;
|
|
||||||
delete[] w->w1;
|
|
||||||
delete[] w->w2;
|
|
||||||
delete[] w->w3;
|
|
||||||
delete[] w->rms_final_weight;
|
|
||||||
delete[] w->wcls;
|
|
||||||
}
|
|
||||||
|
|
||||||
void print_sample_weights(TransformerWeights *w){
|
void print_sample_weights(TransformerWeights *w){
|
||||||
printf("----- Quick print of first of the weight vales of all the variables\n");
|
printf("----- Quick print of first of the weight vales of all the variables\n");
|
||||||
printf("%f\n", w->token_embedding_table[0]);
|
printf("%f\n", w->token_embedding_table[0]);
|
||||||
|
@ -915,7 +915,7 @@ int main(int argc, char ** argv) {
|
||||||
return 1;
|
return 1;
|
||||||
}
|
}
|
||||||
Config config;
|
Config config;
|
||||||
TransformerWeights weights;
|
TransformerWeights weights = {};
|
||||||
{
|
{
|
||||||
FILE *file = fopen(params.fn_llama2c_model, "rb");
|
FILE *file = fopen(params.fn_llama2c_model, "rb");
|
||||||
if (!file) { printf("Unable to open the checkpoint file %s!\n", params.fn_llama2c_model); return 1; }
|
if (!file) { printf("Unable to open the checkpoint file %s!\n", params.fn_llama2c_model); return 1; }
|
||||||
|
@ -957,6 +957,5 @@ int main(int argc, char ** argv) {
|
||||||
printf("Saving llama.c model file %s in ggml format at %s\n", params.fn_llama2c_model, params.fn_llama2c_output_model);
|
printf("Saving llama.c model file %s in ggml format at %s\n", params.fn_llama2c_model, params.fn_llama2c_output_model);
|
||||||
|
|
||||||
ggml_free(model.ctx);
|
ggml_free(model.ctx);
|
||||||
free_weights(&weights);
|
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue