improve f64 support (for convert mostly)

stduhpf · stduhpf · commit 5a508b02a9f0 · 2025-07-08T21:38:38.000+02:00
diff --git a/model.cpp b/model.cpp
@@ -835,6 +835,12 @@ void convert_tensor(void* src,
     } else if (src_type == GGML_TYPE_F32) {
         if (dst_type == GGML_TYPE_F16) {
             ggml_fp32_to_fp16_row((float*)src, (ggml_fp16_t*)dst, n);
+        } else if (dst_type == GGML_TYPE_F64) {
+            double* ddst = (double*)dst;
+            float* fsrc  = (float*)src;
+            for (int64_t i = 0; i < n; i++) {
+                ddst[i] = (double)(fsrc[i]);
+            }
         } else {
             std::vector<float> imatrix(n_per_row, 1.0f);  // dummy importance matrix
             const float* im = imatrix.data();
@@ -843,6 +849,41 @@ void convert_tensor(void* src,
     } else if (dst_type == GGML_TYPE_F32) {
         if (src_type == GGML_TYPE_F16) {
             ggml_fp16_to_fp32_row((ggml_fp16_t*)src, (float*)dst, n);
+        } else if (src_type == GGML_TYPE_F64) {
+            float* fdst  = (float*)dst;
+            double* dsrc = (double*)src;
+            for (int64_t i = 0; i < n; i++) {
+                fdst[i] = (float)(dsrc[i]);
+            }
+        } else {
+            auto qtype = ggml_get_type_traits(src_type);
+            if (qtype->to_float == NULL) {
+                throw std::runtime_error(format("type %s unsupported for integer quantization: no dequantization available",
+                                                ggml_type_name(src_type)));
+            }
+            qtype->to_float(src, (float*)dst, n);
+        }
+    } else if (src_type == GGML_TYPE_F64) {
+        if (dst_type == GGML_TYPE_F16) {
+            // ggml_fp32_to_fp16_row((float*)src, (ggml_fp16_t*)dst, n);
+            ggml_fp16_t* fdst = (ggml_fp16_t*)dst;
+            double* dsrc      = (double*)src;
+            for (int64_t i = 0; i < n; i++) {
+                fdst[i] = ggml_fp32_to_fp16((float)dsrc[i]);
+            }
+        } else {
+            std::vector<float> imatrix(n_per_row, 1.0f);  // dummy importance matrix
+            const float* im = imatrix.data();
+            ggml_quantize_chunk(dst_type, (float*)src, dst, 0, nrows, n_per_row, im);
+        }
+    } else if (dst_type == GGML_TYPE_F64) {
+        if (src_type == GGML_TYPE_F16) {
+            // ggml_fp16_to_fp32_row((ggml_fp16_t*)src, (float*)dst, n);
+            double* ddst      = (double*)dst;
+            ggml_fp16_t* fsrc = (ggml_fp16_t*)src;
+            for (int64_t i = 0; i < n; i++) {
+                ddst[i] = (double)ggml_fp16_to_fp32(fsrc[i]);
+            }
         } else {
             auto qtype = ggml_get_type_traits(src_type);
             if (qtype->to_float == NULL) {