@@ -6546,11 +6546,11 @@ void ggml_compute_forward_im2col_back_f32(
6546
6546
}
6547
6547
}
6548
6548
6549
- static void ggml_call_mul_mat (ggml_type T , const ggml_compute_params * params, int64_t m, int64_t n, int64_t k,
6550
- void * a, void * b, void * c) {
6551
- const ggml_type_traits * traits = ggml_get_type_traits (T );
6549
+ static void ggml_call_mul_mat (ggml_type type , const ggml_compute_params * params, int64_t m, int64_t n, int64_t k,
6550
+ const void * a, const void * b, float * c) {
6551
+ const ggml_type_traits * traits = ggml_get_type_traits (type );
6552
6552
struct ggml_tensor src1 = {};
6553
- src1.type = T ;
6553
+ src1.type = type ;
6554
6554
src1.ne [0 ] = k;
6555
6555
src1.ne [1 ] = m;
6556
6556
src1.ne [2 ] = 1 ;
@@ -6559,10 +6559,10 @@ static void ggml_call_mul_mat(ggml_type T, const ggml_compute_params * params, i
6559
6559
src1.nb [1 ] = k * traits->type_size ;
6560
6560
src1.nb [2 ] = src1.nb [1 ];
6561
6561
src1.nb [3 ] = src1.nb [2 ];
6562
- src1.data = a;
6562
+ src1.data = ( void *) a;
6563
6563
6564
6564
struct ggml_tensor src0 = {};
6565
- src0.type = T ;
6565
+ src0.type = type ;
6566
6566
src0.ne [0 ] = k;
6567
6567
src0.ne [1 ] = n;
6568
6568
src0.ne [2 ] = 1 ;
@@ -6571,7 +6571,7 @@ static void ggml_call_mul_mat(ggml_type T, const ggml_compute_params * params, i
6571
6571
src0.nb [1 ] = k * traits->type_size ;
6572
6572
src0.nb [2 ] = src0.nb [1 ];
6573
6573
src0.nb [3 ] = src0.nb [2 ];
6574
- src0.data = b;
6574
+ src0.data = ( void *) b;
6575
6575
6576
6576
struct ggml_tensor dst = {};
6577
6577
dst.ne [0 ] = n;
@@ -6598,6 +6598,7 @@ static void ggml_compute_forward_conv_2d_impl(const ggml_compute_params * params
6598
6598
ggml_type kernel_type) {
6599
6599
6600
6600
GGML_ASSERT (ggml_is_contiguous (kernel));
6601
+ GGML_ASSERT (kernel_type == GGML_TYPE_F16 || kernel_type == GGML_TYPE_F32);
6601
6602
GGML_ASSERT (kernel->type == kernel_type);
6602
6603
6603
6604
const ggml_type_traits * traits = ggml_get_type_traits (kernel_type);
@@ -6620,9 +6621,9 @@ static void ggml_compute_forward_conv_2d_impl(const ggml_compute_params * params
6620
6621
const int64_t dst_w = dst->ne [0 ];
6621
6622
const int64_t dst_h = dst->ne [1 ];
6622
6623
6623
- float * src_data = (float *) src->data ;
6624
- void * knl_data = kernel->data ;
6625
- float * dst_data = (float *) dst->data ;
6624
+ const float * src_data = (float *) src->data ;
6625
+ void * knl_data = kernel->data ;
6626
+ float * dst_data = (float *) dst->data ;
6626
6627
6627
6628
const int64_t knl_n = knl_w * knl_h * c_in;
6628
6629
const int64_t patch_total = dst->ne [3 ] * dst_w * dst_h;
@@ -6676,7 +6677,7 @@ static void ggml_compute_forward_conv_2d_impl(const ggml_compute_params * params
6676
6677
if (kernel_type == GGML_TYPE_F32) {
6677
6678
*(float *) element_ptr = src_val;
6678
6679
} else if (kernel_type == GGML_TYPE_F16) {
6679
- *(ggml_fp16_t *) element_ptr = GGML_FP32_TO_FP16 (src_val);
6680
+ *(ggml_fp16_t *) element_ptr = GGML_CPU_FP32_TO_FP16 (src_val);
6680
6681
}
6681
6682
}
6682
6683
}
0 commit comments