metal : improve F32, F16 and BF16 mat-vec multiplication (#16057)
* metal : improve F32, F16 and BF16 mat-vec multiplication

  ggml-ci

* metal : make the NSG a function constant in mul_mv kernels

  ggml-ci
This commit is contained in:
@@ -51,6 +51,10 @@ void ggml_metal_cv_free(ggml_metal_cv_t cv) {
|
||||
free(cv);
|
||||
}
|
||||
|
||||
// Stores a 16-bit signed integer constant at slot `idx` of the constant-values
// object wrapped by `cv`.
//
//   cv    - wrapper whose `obj` member receives the value
//           (NOTE(review): presumably an MTLFunctionConstantValues - confirm
//           against the struct definition, which is not visible here)
//   value - the constant to store; tagged as MTLDataTypeShort
//   idx   - destination index, forwarded unchanged to `atIndex:`
void ggml_metal_cv_set_int16(ggml_metal_cv_t cv, int16_t value, int32_t idx) {
    // `value` is a by-value parameter, so this address is only valid for the
    // duration of the call below.
    const void * src = &value;

    [cv->obj setConstantValue:src
                         type:MTLDataTypeShort
                      atIndex:idx];
}
|
||||
|
||||
// Stores a 32-bit signed integer constant at slot `idx` of the constant-values
// object wrapped by `cv`.
//
//   cv    - wrapper whose `obj` member receives the value
//           (NOTE(review): presumably an MTLFunctionConstantValues - confirm
//           against the struct definition, which is not visible here)
//   value - the constant to store; tagged as MTLDataTypeInt
//   idx   - destination index, forwarded unchanged to `atIndex:`
void ggml_metal_cv_set_int32(ggml_metal_cv_t cv, int32_t value, int32_t idx) {
    // `value` is a by-value parameter, so this address is only valid for the
    // duration of the call below.
    const void * src = &value;

    [cv->obj setConstantValue:src
                         type:MTLDataTypeInt
                      atIndex:idx];
}
|
||||
|
||||
Reference in New Issue
Block a user