mlx_quantized_matmul function

  1. @Native<Int Function(Pointer<mlx_array>, mlx_array, mlx_array, mlx_array, mlx_array, Bool, mlx_optional_int, mlx_optional_int, Pointer<Char>, mlx_stream)>()
int mlx_quantized_matmul(
  1. Pointer<mlx_array> res,
  2. mlx_array x,
  3. mlx_array w,
  4. mlx_array scales,
  5. mlx_array biases,
  6. bool transpose,
  7. mlx_optional_int group_size,
  8. mlx_optional_int bits,
  9. Pointer<Char> mode,
  10. mlx_stream s,
)

Implementation

/// FFI binding for the native `mlx_quantized_matmul` function.
///
/// The `@ffi.Native` annotation carries no explicit `symbol`, so the call is
/// resolved against a native symbol with the same name as this Dart
/// function. The native type list in the annotation mirrors the Dart
/// parameter list one-to-one and in the same order (`ffi.Bool` <-> `bool`,
/// `ffi.Int` <-> `int`); the two lists must be kept in sync.
///
/// Parameter meanings below are inferred from the names only; confirm them
/// against the MLX C API header before relying on them:
///
/// * [res] - pointer to an `mlx_array`; presumably the output slot that the
///   native call fills in.
/// * [x], [w], [scales], [biases] - `mlx_array` values passed by value;
///   presumably the input, the quantized weights and their quantization
///   parameters.
/// * [transpose] - boolean flag forwarded to the native call.
/// * [group_size], [bits] - `mlx_optional_int` values; presumably optional
///   quantization settings where "unset" selects a native default.
/// * [mode] - pointer to native `char` data; presumably a NUL-terminated C
///   string whose memory is owned by the caller (TODO confirm).
/// * [s] - the `mlx_stream` handed to the native call.
///
/// Returns the native function's C `int` result. NOTE(review): this looks
/// like a status code (0 on success), but that is not visible from this
/// declaration; verify against the native API.
@ffi.Native<
  ffi.Int Function(
    ffi.Pointer<mlx_array>,
    mlx_array,
    mlx_array,
    mlx_array,
    mlx_array,
    ffi.Bool,
    mlx_optional_int,
    mlx_optional_int,
    ffi.Pointer<ffi.Char>,
    mlx_stream,
  )
>()
external int mlx_quantized_matmul(
  ffi.Pointer<mlx_array> res,
  mlx_array x,
  mlx_array w,
  mlx_array scales,
  mlx_array biases,
  bool transpose,
  mlx_optional_int group_size,
  mlx_optional_int bits,
  ffi.Pointer<ffi.Char> mode,
  mlx_stream s,
);