Fix imatrix collection on CPU backend (treat a NULL src1->buffer as host memory)

stduhpf · stduhpf · commit a386ba9f2829 · 2025-04-01T14:20:15.000+02:00
diff --git a/imatrix.cpp b/imatrix.cpp
@@ -42,7 +42,7 @@ bool IMatrixCollector::collect_imatrix(struct ggml_tensor* t, bool ask, void* us
             return false;
         // why are small batches ignored (<16 tokens)?
         // if (src1->ne[1] < 16 || src1->type != GGML_TYPE_F32) return false;
-        if (!(wname.substr(0, 6) == "model." || wname.substr(0, 17) == "cond_stage_model." || wname.substr(0,14) == "text_encoders."))
+        if (!(wname.substr(0, 6) == "model." || wname.substr(0, 17) == "cond_stage_model." || wname.substr(0, 14) == "text_encoders."))
             return false;
         return true;
     }
@@ -51,7 +51,7 @@ bool IMatrixCollector::collect_imatrix(struct ggml_tensor* t, bool ask, void* us
     std::lock_guard<std::mutex> lock(m_mutex);
 
     // copy the data from the GPU memory if needed
-    const bool is_host = ggml_backend_buffer_is_host(src1->buffer);
+    const bool is_host = src1->buffer == NULL || ggml_backend_buffer_is_host(src1->buffer);
 
     if (!is_host) {
         m_src1_data.resize(ggml_nelements(src1));
@@ -144,10 +144,9 @@ bool IMatrixCollector::collect_imatrix(struct ggml_tensor* t, bool ask, void* us
         }
     }
     return true;
-
 }
 
-void IMatrixCollector::save_imatrix(std::string fname,int ncall) const {
+void IMatrixCollector::save_imatrix(std::string fname, int ncall) const {
     LOG_INFO("SAVING_IMATRIX to %s\n", fname.c_str());
 
     if (ncall > 0) {

Original file line number	Diff line number	Diff line change
`@@ -42,7 +42,7 @@ bool IMatrixCollector::collect_imatrix(struct ggml_tensor* t, bool ask, void* us`
`42`	`42`	`return false;`
`43`	`43`	`// why are small batches ignored (<16 tokens)?`
`44`	`44`	`// if (src1->ne[1] < 16 \|\| src1->type != GGML_TYPE_F32) return false;`
`45`		`- if (!(wname.substr(0, 6) == "model." \|\| wname.substr(0, 17) == "cond_stage_model." \|\| wname.substr(0,14) == "text_encoders."))`
	`45`	`+ if (!(wname.substr(0, 6) == "model." \|\| wname.substr(0, 17) == "cond_stage_model." \|\| wname.substr(0, 14) == "text_encoders."))`
`46`	`46`	`return false;`
`47`	`47`	`return true;`
`48`	`48`	`}`
`@@ -51,7 +51,7 @@ bool IMatrixCollector::collect_imatrix(struct ggml_tensor* t, bool ask, void* us`
`51`	`51`	`std::lock_guard<std::mutex> lock(m_mutex);`
`52`	`52`
`53`	`53`	`// copy the data from the GPU memory if needed`
`54`		`- const bool is_host = ggml_backend_buffer_is_host(src1->buffer);`
	`54`	`+ const bool is_host = src1->buffer == NULL \|\| ggml_backend_buffer_is_host(src1->buffer);`
`55`	`55`
`56`	`56`	`if (!is_host) {`
`57`	`57`	`m_src1_data.resize(ggml_nelements(src1));`
`@@ -144,10 +144,9 @@ bool IMatrixCollector::collect_imatrix(struct ggml_tensor* t, bool ask, void* us`
`144`	`144`	`}`
`145`	`145`	`}`
`146`	`146`	`return true;`
`147`		`-`
`148`	`147`	`}`
`149`	`148`
`150`		`-void IMatrixCollector::save_imatrix(std::string fname,int ncall) const {`
	`149`	`+void IMatrixCollector::save_imatrix(std::string fname, int ncall) const {`
`151`	`150`	`LOG_INFO("SAVING_IMATRIX to %s\n", fname.c_str());`
`152`	`151`
`153`	`152`	`if (ncall > 0) {`