@@ -1209,6 +1209,11 @@ void aclnn_sin(ggml_backend_cann_context& ctx, aclTensor* acl_src,
1209
1209
GGML_CANN_CALL_ACLNN_OP (Sin, acl_src, acl_dst);
1210
1210
}
1211
1211
1212
// Runs the aclnn GeluV2 operator by handing acl_src, the literal 0 and
// acl_dst to GGML_CANN_CALL_ACLNN_OP.
// ctx is never named in the body; presumably the macro picks it up from the
// enclosing scope — TODO confirm against the macro definition.
+ void aclnn_geluv2 (ggml_backend_cann_context& ctx, aclTensor* acl_src,
1213
+ aclTensor* acl_dst) {
1214
// NOTE(review): the 0 is presumably GeluV2's approximation-mode selector
// (0 = exact / "none") — confirm against the aclnnGeluV2 documentation.
+ GGML_CANN_CALL_ACLNN_OP (GeluV2, acl_src, 0 , acl_dst);
1215
+ }
1216
+
1212
1217
void ggml_cann_timestep_embedding (ggml_backend_cann_context& ctx,
1213
1218
ggml_tensor* dst) {
1214
1219
const ggml_tensor* src = dst->src [0 ];
@@ -1783,7 +1788,7 @@ void ggml_cann_get_rows(ggml_backend_cann_context& ctx, ggml_tensor* dst) {
1783
1788
src0->data , ACL_INT8, sizeof (int8_t ), weight_ne, weight_nb,
1784
1789
GGML_MAX_DIMS + 1 );
1785
1790
aclTensor* acl_scale_tensor = ggml_cann_create_tensor (
1786
- src0->data , ACL_FLOAT16, sizeof (float16_t ), scale_ne, scale_nb,
1791
+ src0->data , ACL_FLOAT16, sizeof (uint16_t ), scale_ne, scale_nb,
1787
1792
GGML_MAX_DIMS + 1 , ACL_FORMAT_ND, scale_offset);
1788
1793
aclTensor* dequant_tensor = ggml_cann_create_tensor (
1789
1794
dequant_buffer_allocator.get (), ACL_FLOAT, sizeof (float_t ),
0 commit comments