mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-12 03:31:46 +00:00
imatrix : keep intermediate imatrix results (#5077)
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
This commit is contained in:
parent
d6bd4d46dd
commit
15bceec2d7
@ -26,6 +26,7 @@ struct StatParams {
|
|||||||
std::string ofile = "imatrix.dat";
|
std::string ofile = "imatrix.dat";
|
||||||
int n_output_frequency = 10;
|
int n_output_frequency = 10;
|
||||||
int verbosity = 1;
|
int verbosity = 1;
|
||||||
|
int keep_every = 0;
|
||||||
bool collect_output_weight = false;
|
bool collect_output_weight = false;
|
||||||
};
|
};
|
||||||
|
|
||||||
@ -42,6 +43,9 @@ private:
|
|||||||
int m_last_call = 0;
|
int m_last_call = 0;
|
||||||
std::vector<float> m_src1_data;
|
std::vector<float> m_src1_data;
|
||||||
std::vector<int> m_ids; // the expert ids from ggml_mul_mat_id
|
std::vector<int> m_ids; // the expert ids from ggml_mul_mat_id
|
||||||
|
//
|
||||||
|
void save_imatrix(const char * file_name) const;
|
||||||
|
void keep_imatrix(int ncall) const;
|
||||||
};
|
};
|
||||||
|
|
||||||
bool IMatrixCollector::collect_imatrix(struct ggml_tensor * t, bool ask, void * user_data) {
|
bool IMatrixCollector::collect_imatrix(struct ggml_tensor * t, bool ask, void * user_data) {
|
||||||
@ -117,6 +121,9 @@ bool IMatrixCollector::collect_imatrix(struct ggml_tensor * t, bool ask, void *
|
|||||||
if (m_last_call % m_params.n_output_frequency == 0) {
|
if (m_last_call % m_params.n_output_frequency == 0) {
|
||||||
save_imatrix();
|
save_imatrix();
|
||||||
}
|
}
|
||||||
|
if (m_params.keep_every > 0 && m_last_call%m_params.keep_every == 0) {
|
||||||
|
keep_imatrix(m_last_call);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
@ -143,6 +150,9 @@ bool IMatrixCollector::collect_imatrix(struct ggml_tensor * t, bool ask, void *
|
|||||||
if (m_last_call % m_params.n_output_frequency == 0) {
|
if (m_last_call % m_params.n_output_frequency == 0) {
|
||||||
save_imatrix();
|
save_imatrix();
|
||||||
}
|
}
|
||||||
|
if (m_params.keep_every > 0 && m_last_call%m_params.keep_every == 0) {
|
||||||
|
keep_imatrix(m_last_call);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -150,7 +160,18 @@ bool IMatrixCollector::collect_imatrix(struct ggml_tensor * t, bool ask, void *
|
|||||||
}
|
}
|
||||||
|
|
||||||
void IMatrixCollector::save_imatrix() const {
|
void IMatrixCollector::save_imatrix() const {
|
||||||
const char * fname = m_params.ofile.empty() ? "imatrix.dat" : m_params.ofile.c_str();
|
save_imatrix(m_params.ofile.empty() ? "imatrix.dat" : m_params.ofile.c_str());
|
||||||
|
}
|
||||||
|
|
||||||
|
void IMatrixCollector::keep_imatrix(int ncall) const {
|
||||||
|
auto file_name = m_params.ofile;
|
||||||
|
if (file_name.empty()) file_name = "imatrix.dat";
|
||||||
|
file_name += ".at_";
|
||||||
|
file_name += std::to_string(ncall);
|
||||||
|
save_imatrix(file_name.c_str());
|
||||||
|
}
|
||||||
|
|
||||||
|
void IMatrixCollector::save_imatrix(const char * fname) const {
|
||||||
std::ofstream out(fname, std::ios::binary);
|
std::ofstream out(fname, std::ios::binary);
|
||||||
int n_entries = m_stats.size();
|
int n_entries = m_stats.size();
|
||||||
out.write((const char*)&n_entries, sizeof(n_entries));
|
out.write((const char*)&n_entries, sizeof(n_entries));
|
||||||
@ -400,6 +421,8 @@ int main(int argc, char ** argv) {
|
|||||||
sparams.verbosity = std::stoi(argv[++iarg]);
|
sparams.verbosity = std::stoi(argv[++iarg]);
|
||||||
} else if (arg == "--no-ppl") {
|
} else if (arg == "--no-ppl") {
|
||||||
compute_ppl = false;
|
compute_ppl = false;
|
||||||
|
} else if (arg == "--keep-imatrix") {
|
||||||
|
sparams.keep_every = std::stoi(argv[++iarg]);
|
||||||
} else {
|
} else {
|
||||||
args.push_back(argv[iarg]);
|
args.push_back(argv[iarg]);
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user