From 4a01d78e3fd46aef9b504d17d0ec8fbf953ab5bc Mon Sep 17 00:00:00 2001
From: VDurocher <84510889+VDurocher@users.noreply.github.com>
Date: Tue, 7 Apr 2026 15:03:30 +0200
Subject: [PATCH 1/3] refactor: make QuantizationMode an algebraic enum with
 associated values (#285)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Convert QuantizationMode from String raw value enum to algebraic enum
- Add case affine(groupSize: Int = 64, bits: Int = 4) with associated values
- Keep mxfp4, mxfp8, nvfp4 as simple cases (fixed parameters)
- Add cName computed property to replace rawValue for C API calls
- Add groupSize and bits computed properties on QuantizationMode
- Add manual Codable conformance (required since associated values prevent String raw type)
- Add Equatable conformance (auto-synthesized by Swift)
- Update all call sites: mode.rawValue → mode.cName
- Update all default parameter values: .affine → .affine()
- Update Quantized.swift with matching .affine() defaults
---
 Source/MLX/Ops.swift | 3248 +-----------------------------------------
 1 file changed, 1 insertion(+), 3247 deletions(-)
diff --git a/Source/MLX/Ops.swift b/Source/MLX/Ops.swift
index c640eb44..65d4e73c 100644
--- a/Source/MLX/Ops.swift
+++ b/Source/MLX/Ops.swift
@@ -15,3250 +15,4 @@ func broadcast(arrays: some Collection<MLXArray>, stream: StreamOrDevice = .defa
     defer { mlx_vector_array_free(result) }
 
     return mlx_vector_array_values(result)
-}
-
-/// Element-wise addition.
-///
-/// Add two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = MLXArray([4, 5, 6])
-///
-/// // equivalent to a + b + 7
-/// let r = add(add(a, b), 7)
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``MLXArray/+(_:_:)-(MLXArray,MLXArray)``
-public func add(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_add(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-@available(*, deprecated, renamed: "addMM(_:_:_:alpha:beta:stream:)")
-@_documentation(visibility: internal)
-public func addmm<A: ScalarOrArray, B: ScalarOrArray, C: ScalarOrArray>(
-    _ c: C, _ a: A, _ b: B, alpha: Float = 1.0, beta: Float = 1.0, stream: StreamOrDevice = .default
-) -> MLXArray {
-    addMM(c, a, b, alpha: alpha, beta: beta, stream: stream)
-}
-
-/// Matrix multiplication with addition and optional scaling.
-///
-/// Perform the (possibly batched) matrix multiplication of two arrays and add to the result
-/// with optional scaling factors.
-///
-/// Equivalent to:
-///
-/// ```swift
-/// alpha * matmul(a, b) + beta * c
-/// ```
-///
-/// > Note the ordering of the parameters
-///
-/// - Parameters:
-///   - c: input array or scalar
-///   - a: input array or scalar
-///   - b: input array or scalar
-///   - alpha: optional scaling for the matrix product of `a` and `b`
-///   - beta: optional scaling factor for `c`
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - ``matmul(_:_:stream:)``
-/// - ``blockMaskedMM(_:_:blockSize:maskOut:maskLHS:maskRHS:stream:)``
-public func addMM(
-    _ c: some ScalarOrArray, _ a: some ScalarOrArray, _ b: some ScalarOrArray, alpha: Float = 1.0,
-    beta: Float = 1.0, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    let (_, c) = toArrays(a, c)
-    var result = mlx_array_new()
-    mlx_addmm(&result, c.ctx, a.ctx, b.ctx, alpha, beta, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise inverse cosine.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``cos(_:stream:)``
-public func acos(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_arccos(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise inverse hyperbolic cosine.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``cosh(_:stream:)``
-public func acosh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_arccosh(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise inverse sine.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``sin(_:stream:)``
-public func asin(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_arcsin(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise inverse hyperbolic sine.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``sinh(_:stream:)``
-public func asinh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_arcsinh(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise inverse tangent.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``tan(_:stream:)``
-public func atan(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_arctan(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise inverse tangent of the ratio of two arrays.
-///
-/// - Parameters:
-///   - a: first input array
-///   - b: second input array
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``atan(_:stream:)``
-public func atan2(_ a: MLXArray, _ b: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_arctan2(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise inverse hyperbolic tangent.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``tanh(_:stream:)``
-public func atanh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_arctanh(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Convert array to have at least 1 dimension.
-///
-/// ### See Also
-/// - <doc:shapes>
-public func atLeast1D(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_atleast_1d(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Convert array to have at least 2 dimensions.
-///
-/// ### See Also
-/// - <doc:shapes>
-public func atLeast2D(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_atleast_2d(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Convert array to have at least 3 dimensions.
-///
-/// ### See Also
-/// - <doc:shapes>
-public func atLeast3D(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_atleast_3d(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Returns the indices that partition the array.
-///
-/// The ordering of the elements within a partition in given by the indices is undefined.
-///
-/// For example:
-///
-/// ```swift
-/// // array with values in random order
-/// let array = MLXRandom.randInt(0 ..< 100, [10])
-///
-/// let partitionIndexes = argPartition(array, kth: 3)
-///
-/// // the partitioned array.  the pivot is at partitioned[3] and all values
-/// // with lower indexes will be less than (in undefined order)
-/// let partitioned = array[sortIndexes]
-/// ```
-///
-/// - Parameters:
-///     - array: input array
-///     - kth: element index at the `kth` position in the output will give the sorted position.  All indices before the`kth` position will be of elements less than or equal to the element at the `kth` index and all indices after will be elemenents greater than or equal to the element at the `kth` position.
-///     - axis: axis to partition over
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:indexes>
-/// - ``argPartition(_:kth:stream:)``
-/// - ``partitioned(_:kth:axis:stream:)``
-public func argPartition(_ array: MLXArray, kth: Int, axis: Int, stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_argpartition_axis(&result, array.ctx, kth.int32, axis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Returns the indices that partition the flattened array.
-///
-/// The ordering of the elements within a partition in given by the indices is undefined.
-///
-/// - Parameters:
-///     - array: input array
-///     - kth: element index at the `kth` position in the output will give the sorted position.  All indices before the`kth` position will be of elements less than or equal to the element at the `kth` index and all indices after will be elemenents greater than or equal to the element at the `kth` position.
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:indexes>
-/// - ``argPartition(_:kth:axis:stream:)``
-/// - ``partitioned(_:kth:axis:stream:)``
-public func argPartition(_ array: MLXArray, kth: Int, stream: StreamOrDevice = .default) -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_argpartition(&result, array.ctx, kth.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Returns the indices that sort the array.
-///
-/// ```swift
-/// // array with values in random order
-/// let array = MLXRandom.randInt(0 ..< 100, [10])
-///
-/// let sortIndexes = argSort(array, axis: -1)
-///
-/// // the array in sorted order
-/// let sorted = array[sortIndexes]
-/// ```
-///
-/// - Parameters:
-///     - array: input array
-///     - axis: axis to sort over
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:indexes>
-/// - ``argSort(_:stream:)``
-public func argSort(_ array: MLXArray, axis: Int, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_argsort_axis(&result, array.ctx, axis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Returns the indices that sort the array.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:indexes>
-/// - ``argSort(_:axis:stream:)``
-public func argSort(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_argsort(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Create a view into the array with the given shape and strides.
-///
-/// The resulting array will always be as if the provided array was row
-/// contiguous regardless of the provided arrays storage order and current strides.
-///
-/// > Note: This function should be used with caution as it changes
-/// the shape and strides of the array directly. This can lead to the
-/// resulting array pointing to invalid memory locations which can
-/// result into crashes.
-///
-/// Here are two examples of use:
-///
-/// ```swift
-/// // strides in the reverse order is a transpose
-/// let a = MLXArray(0 ..< 12, [4, 3])
-///
-/// let transposed = asStrided(a, [3, 4], strides: [1, 3])
-/// ```
-///
-/// and:
-///
-/// ```swift
-/// // negative strides and an offset produce a reversed array
-/// let a = MLXArray(0 ..< 16, [4, 4])
-///
-/// let b = asStrided(a, [4, 4], strides: [-4, -1], offset: 15)
-/// let same = MLXArray((0 ..< 16).reversed(), [4, 4])
-/// ```
-///
-/// - Parameters:
-///     - array: input array
-///     - shape: The shape of the resulting array. If not specified it defaults to `array.shape`
-///     - strides: The strides of the resulting array. If not specified it defaults to the reverse
-///                exclusive cumulative product of `array.shape`
-///     - offset: Skip that many elements from the beginning of the input array
-///     - stream: stream or device to evaluate on
-///
-/// - Returns: The output array which is the strided view of the input
-///
-/// ### See Also
-/// - <doc:shapes>
-public func asStrided(
-    _ array: MLXArray, _ shape: (some Collection<Int>)? = [Int]?.none,
-    strides: (some Collection<Int>)? = [Int]?.none, offset: Int = 0,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    let shape = shape.map { Array($0) } ?? array.shape
-
-    let resolvedStrides: [Int64]
-    if let strides {
-        resolvedStrides = strides.map { .init($0) }
-    } else {
-        var result = [Int64]()
-        var cum = 1
-        for v in shape.reversed() {
-            result.append(Int64(cum))
-            cum = cum * v
-        }
-        resolvedStrides = result.reversed()
-    }
-
-    var result = mlx_array_new()
-    mlx_as_strided(
-        &result,
-        array.ctx, shape.asInt32, shape.count, resolvedStrides, resolvedStrides.count,
-        offset,
-        stream.ctx)
-    return MLXArray(result)
-}
-
-/// Return the Bartlett window.
-///
-/// The Bartlett window is a taper formed by using a weighted cosine.
-///
-/// - Parameters:
-///   - m: number of points in the output window
-///   - stream: stream to evaluate on
-/// - Returns: The window, with the maximum value normalized to one (the value one appears only if
-///     the number of samples is odd).
-public func bartlett(
-    _ m: Int, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_bartlett(&result, Int32(m), stream.ctx)
-    return MLXArray(result)
-}
-
-/// Return the Blackman window.
-///
-/// The Blackman window is a taper formed by using the first three terms of a summation of cosines.
-///
-/// - Parameters:
-///   - m: number of points in the output window
-///   - stream: stream to evaluate on
-/// - Returns: The window, with the maximum value normalized to one (the value one appears only if
-///     the number of samples is odd).
-public func blackman(
-    _ m: Int, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_blackman(&result, Int32(m), stream.ctx)
-    return MLXArray(result)
-}
-
-/// Matrix multiplication with block masking.
-///
-/// Perform the (possibly batched) matrix multiplication of two arrays and with blocks
-/// of size `blockSize x blockSize` optionally masked out.
-///
-/// Assuming `a` with shape (..., `M`, `K`) and b with shape (..., `K`, `N`)
-///
-/// * `maskLHS` must have shape (..., ceil(`M` / `blockSize`), ceil(`K` / `blockSize`))
-///
-/// * `maskRHS` must have shape (..., ceil(`K` / `blockSize`), ceil(`N` / `blockSize`))
-///
-/// * `maskOut` must have shape (..., ceil(`M` / `blockSize`), ceil(`N` / `blockSize`))
-///
-/// > Note: Only `block_size=64` and `block_size=32` are currently supported
-///
-/// - Parameters:
-///   - a: input array
-///   - b: input array
-///   - blockSize: Size of blocks to be masked. Must be `32` or `64`
-///   - maskOut: Boolean mask for output
-///   - maskLHS: Boolean mask for a
-///   - maskRHS: Boolean mask for b
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``multiply(_:_:stream:)``
-/// - ``addMM(_:_:_:alpha:beta:stream:)``
-/// - ``MLXArray/matmul(_:stream:)``
-/// - ``matmul(_:_:stream:)``
-public func blockMaskedMM(
-    _ a: MLXArray, _ b: MLXArray, blockSize: Int = 64, maskOut: MLXArray? = nil,
-    maskLHS: MLXArray? = nil, maskRHS: MLXArray? = nil, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-
-    mlx_block_masked_mm(
-        &result,
-        a.ctx, b.ctx, blockSize.int32, (maskOut ?? .mlxNone).ctx, (maskLHS ?? .mlxNone).ctx,
-        (maskRHS ?? .mlxNone).ctx, stream.ctx)
-
-    return MLXArray(result)
-}
-
-/// Broadcast an array to the given shape.
-///
-/// - Parameters:
-///     - array: input array
-///     - shape: shape to broadcast to
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:broadcasting>
-public func broadcast(
-    _ array: MLXArray, to shape: some Collection<Int>, stream: StreamOrDevice = .default
-)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_broadcast_to(&result, array.ctx, shape.asInt32, shape.count, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise ceil.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``floor(_:stream:)``
-public func ceil(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_ceil(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Clip the values of the array between the given minimum and maximum.
-///
-/// - Parameters:
-///     - array: input array
-///     - min: minimum value (must broadcast to `array`)
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``clip(_:max:stream:)``
-/// - ``clip(_:min:max:stream:)``
-public func clip(
-    _ array: MLXArray, min: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (array, min) = toArrays(array, min)
-    var result = mlx_array_new()
-    let max = mlx_array_new()
-    defer { mlx_array_free(max) }
-    mlx_clip(&result, array.ctx, min.ctx, max, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Clip the values of the array between the given minimum and maximum.
-///
-/// - Parameters:
-///     - array: input array
-///     - min: minimum value (must broadcast to `array`)
-///     - max: maximum value (must broadcast to `array`).  If omitted only the `min` will be honored.
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``clip(_:max:stream:)``
-public func clip(
-    _ array: MLXArray, min: some ScalarOrArray, max: some ScalarOrArray,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (array, min) = toArrays(array, min)
-    let (_, max) = toArrays(array, max)
-    var result = mlx_array_new()
-    mlx_clip(&result, array.ctx, min.ctx, max.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Clip the values of the array up to the given maximum.
-///
-/// - Parameters:
-///     - array: input array
-///     - max: maximum value (must broadcast to `array`)
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``clip(_:min:stream:)``
-/// - ``clip(_:min:max:stream:)``
-public func clip(_ array: MLXArray, max: some ScalarOrArray, stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    let (array, max) = toArrays(array, max)
-    var result = mlx_array_new()
-    let min = mlx_array_new()
-    defer { mlx_array_free(min) }
-    mlx_clip(&result, array.ctx, min, max.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Concatenate the arrays along the given axis.
-///
-/// - Parameters:
-///     - arrays: input arrays to concatenate
-///     - axis: the axis along which to concatenate
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:shapes>
-public func concatenated(
-    _ arrays: some Collection<MLXArray>, axis: Int = 0, stream: StreamOrDevice = .default
-)
-    -> MLXArray
-{
-    let vector_array = new_mlx_vector_array(arrays)
-    defer { mlx_vector_array_free(vector_array) }
-
-    var result = mlx_array_new()
-    mlx_concatenate_axis(&result, vector_array, axis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// 1D convolution over an input with several channels.
-///
-/// > Only the default `groups=1` is currently supported.
-///
-/// - Parameters:
-///     - array: input array of shape `[N, H, C_in]`
-///     - weight: weight array of shape `[C_out, H, C_in]`
-///     - stride: kernel stride
-///     - padding: input padding
-///     - dilation: kernel dilation
-///     - groups: input feature groups
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:convolution>
-/// - ``conv2d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``conv3d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``convolve(_:_:mode:stream:)``
-public func conv1d(
-    _ array: MLXArray, _ weight: MLXArray, stride: Int = 1, padding: Int = 0, dilation: Int = 1,
-    groups: Int = 1, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_conv1d(
-        &result,
-        array.ctx, weight.ctx, stride.int32, padding.int32, dilation.int32, groups.int32,
-        stream.ctx)
-    return MLXArray(result)
-}
-
-/// 2D convolution over an input with several channels.
-///
-/// > Only the default `groups=1` is currently supported.
-///
-/// The numeric parameters may be given as single values:
-///
-/// ```swift
-/// padding: 1
-/// ```
-///
-/// This will produce a padding of `(1, 1)`.  You can also give an array:
-///
-/// ```swift
-/// padding: [2, 3]
-/// ```
-///
-/// See ``IntOrPair`` for more information.
-///
-/// - Parameters:
-///     - array: input array of shape `[N, H, W, C_in]`
-///     - weight: weight array of shape `[C_out, H, W, C_in]`
-///     - stride: kernel stride
-///     - padding: input padding
-///     - dilation: kernel dilation
-///     - groups: input feature groups
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:convolution>
-/// - ``IntOrPair``
-/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``conv3d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``convolve(_:_:mode:stream:)``
-/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,IntOrArray,IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
-public func conv2d(
-    _ array: MLXArray, _ weight: MLXArray, stride: IntOrPair = 1, padding: IntOrPair = 0,
-    dilation: IntOrPair = 1, groups: Int = 1, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_conv2d(
-        &result,
-        array.ctx, weight.ctx, stride.first.int32, stride.second.int32, padding.first.int32,
-        padding.second.int32, dilation.first.int32, dilation.second.int32, groups.int32,
-        stream.ctx)
-    return MLXArray(result)
-}
-
-/// 3D convolution over an input with several channels.
-///
-/// > Only the default `groups=1` is currently supported.
-///
-/// The numeric parameters may be given as single values:
-///
-/// ```swift
-/// padding: 1
-/// ```
-///
-/// This will produce a padding of `(1, 1, 1)`.  You can also give an array:
-///
-/// ```swift
-/// padding: [2, 3, 3]
-/// ```
-///
-/// See ``IntOrTriple`` for more information.
-///
-/// - Parameters:
-///     - array: input array of shape `[N, D, H, W, C_in]`
-///     - weight: weight array of shape `[C_out, D, H, W, C_in]`
-///     - stride: kernel stride
-///     - padding: input padding
-///     - dilation: kernel dilation
-///     - groups: input feature groups
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:convolution>
-/// - ``IntOrTriple``
-/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``conv2d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``convolve(_:_:mode:stream:)``
-/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,IntOrArray,IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
-public func conv3d(
-    _ array: MLXArray, _ weight: MLXArray, stride: IntOrTriple = 1, padding: IntOrTriple = 0,
-    dilation: IntOrTriple = 1, groups: Int = 1, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_conv3d(
-        &result,
-        array.ctx, weight.ctx,
-        stride.first.int32, stride.second.int32, stride.third.int32,
-        padding.first.int32, padding.second.int32, padding.third.int32,
-        dilation.first.int32, dilation.second.int32, dilation.third.int32,
-        groups.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// General convolution over an input with several channels.
-///
-/// > Only 1d and 2d convolutions are supported at the moment
-///
-/// > the default `groups: 1` is currently supported
-///
-/// - Parameters:
-///   - array: Input array of shape `(N, ..., C_in)`
-///   - weight: Weight array of shape `(C_out, ..., C_in)`
-///   - strides: `Int` or `some Collection<Int>` with kernel strides.  All dimensions get the
-///   same stride if only one number is specified.
-///   - padding: `Int` or `some Collection<Int>` with input padding.  All dimensions get the
-///   same padding if only one number is specified.
-///   - kernelDilation: `Int` or `some Collection<Int>` with kernel dilation.  All dimensions get the
-///   same dilation if only one number is specified.
-///   - inputDilation: `Int` or `some Collection<Int>` with input dilation.  All dimensions get the
-///   same dilation if only one number is specified.
-///   - groups: input feature groups
-///   - flip: Flip the order in which the spatial dimensions of the weights are processed.
-///   Performs the cross-correlation operator when `flip` is `false` and the convolution
-///   operator otherwise.
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:convolution>
-/// - ``IntOrArray``
-/// - ``conv2d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,(Int,Int),IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
-public func convGeneral(
-    _ array: MLXArray, _ weight: MLXArray, strides: IntOrArray = 1, padding: IntOrArray = 0,
-    kernelDilation: IntOrArray = 1, inputDilation: IntOrArray = 1, groups: Int = 1,
-    flip: Bool = false,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_conv_general(
-        &result,
-        array.ctx, weight.ctx,
-        strides.asInt32Array, strides.count,
-        padding.asInt32Array, padding.count,
-        padding.asInt32Array, padding.count,
-        kernelDilation.asInt32Array, kernelDilation.count,
-        inputDilation.asInt32Array, inputDilation.count,
-        groups.int32, flip, stream.ctx)
-    return MLXArray(result)
-}
-
-/// General convolution over an input with several channels with a padding pair.
-///
-/// > Only 1d and 2d convolutions are supported at the moment
-///
-/// > the default `groups: 1` is currently supported
-///
-/// - Parameters:
-///   - array: Input array of shape `(N, ..., C_in)`
-///   - weight: Weight array of shape `(C_out, ..., C_in)`
-///   - strides: `Int` or `some Collection<Int>` with kernel strides.  All dimensions get the
-///   same stride if only one number is specified.
-///   - padding: pair of padding values to apply to all dimensions
-///   - kernelDilation: `Int` or `some Collection<Int>` with kernel dilation.  All dimensions get the
-///   same dilation if only one number is specified.
-///   - inputDilation: `Int` or `some Collection<Int>` with input dilation.  All dimensions get the
-///   same dilation if only one number is specified.
-///   - groups: input feature groups
-///   - flip: Flip the order in which the spatial dimensions of the weights are processed.
-///   Performs the cross-correlation operator when `flip` is `false` and the convolution
-///   operator otherwise.
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:convolution>
-/// - ``IntOrArray``
-/// - ``conv2d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,(Int,Int),IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
-public func convGeneral(
-    _ array: MLXArray, _ weight: MLXArray, strides: IntOrArray = 1, padding: (Int, Int),
-    kernelDilation: IntOrArray = 1, inputDilation: IntOrArray = 1, groups: Int = 1,
-    flip: Bool = false,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_conv_general(
-        &result,
-        array.ctx, weight.ctx,
-        strides.asInt32Array, strides.count,
-        [padding.0.int32], 1,
-        [padding.1.int32], 1,
-        kernelDilation.asInt32Array, kernelDilation.count,
-        inputDilation.asInt32Array, inputDilation.count,
-        groups.int32, flip, stream.ctx)
-    return MLXArray(result)
-}
-
-/// 1D transposed convolution over an input with several channels.
-///
-/// > Only the default `groups=1` is currently supported.
-///
-/// - Parameters:
-///     - array: input array of shape `[N, H, C_in]`
-///     - weight: weight array of shape `[C_out, H, C_in]`
-///     - stride: kernel stride
-///     - padding: input padding
-///     - dilation: kernel dilation
-///     - outputPadding: output padding
-///     - groups: input feature groups
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:convolution>
-/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``convTransposed2d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
-/// - ``convTransposed3d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
-/// - ``convolve(_:_:mode:stream:)``
-public func convTransposed1d(
-    _ array: MLXArray, _ weight: MLXArray, stride: Int = 1, padding: Int = 0,
-    dilation: Int = 1, outputPadding: Int = 0, groups: Int = 1,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_conv_transpose1d(
-        &result,
-        array.ctx, weight.ctx, stride.int32, padding.int32,
-        dilation.int32, outputPadding.int32, groups.int32,
-        stream.ctx)
-    return MLXArray(result)
-}
-
-/// 2D transposed convolution over an input with several channels.
-///
-/// > Only the default `groups=1` is currently supported.
-///
-/// The numeric parameters may be given as single values:
-///
-/// ```swift
-/// padding: 1
-/// ```
-///
-/// This will produce a padding of `(1, 1)`.  You can also give an array:
-///
-/// ```swift
-/// padding: [2, 3]
-/// ```
-///
-/// See ``IntOrPair`` for more information.
-///
-/// - Parameters:
-///     - array: input array of shape `[N, H, W, C_in]`
-///     - weight: weight array of shape `[C_out, H, W, C_in]`
-///     - stride: kernel stride
-///     - padding: input padding
-///     - dilation: kernel dilation
-///     - outputPadding: output padding
-///     - groups: input feature groups
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:convolution>
-/// - ``IntOrPair``
-/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``convTransposed1d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
-/// - ``convTransposed3d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
-/// - ``convolve(_:_:mode:stream:)``
-/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,IntOrArray,IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
-public func convTransposed2d(
-    _ array: MLXArray, _ weight: MLXArray, stride: IntOrPair = 1, padding: IntOrPair = 0,
-    dilation: IntOrPair = 1, outputPadding: IntOrPair = 0, groups: Int = 1,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_conv_transpose2d(
-        &result,
-        array.ctx, weight.ctx, stride.first.int32, stride.second.int32, padding.first.int32,
-        padding.second.int32, dilation.first.int32, dilation.second.int32,
-        outputPadding.first.int32, outputPadding.second.int32, groups.int32,
-        stream.ctx)
-    return MLXArray(result)
-}
-
-/// 3D transposed convolution over an input with several channels.
-///
-/// > Only the default `groups=1` is currently supported.
-///
-/// The numeric parameters may be given as single values:
-///
-/// ```swift
-/// padding: 1
-/// ```
-///
-/// This will produce a padding of `(1, 1, 1)`.  You can also give an array:
-///
-/// ```swift
-/// padding: [2, 3, 3]
-/// ```
-///
-/// See ``IntOrTriple`` for more information.
-///
-/// - Parameters:
-///     - array: input array of shape `[N, D, H, W, C_in]`
-///     - weight: weight array of shape `[C_out, D, H, W, C_in]`
-///     - stride: kernel stride
-///     - padding: input padding
-///     - dilation: kernel dilation
-///     - outputPadding: output padding
-///     - groups: input feature groups
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:convolution>
-/// - ``IntOrTriple``
-/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``convTransposed1d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
-/// - ``convTransposed3d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
-/// - ``convolve(_:_:mode:stream:)``
-/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,IntOrArray,IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
-public func convTransposed3d(
-    _ array: MLXArray, _ weight: MLXArray, stride: IntOrTriple = 1, padding: IntOrTriple = 0,
-    dilation: IntOrTriple = 1, outputPadding: IntOrTriple = 0, groups: Int = 1,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_conv_transpose3d(
-        &result,
-        array.ctx, weight.ctx,
-        stride.first.int32, stride.second.int32, stride.third.int32,
-        padding.first.int32, padding.second.int32, padding.third.int32,
-        dilation.first.int32, dilation.second.int32, dilation.third.int32,
-        outputPadding.first.int32, outputPadding.second.int32, outputPadding.third.int32,
-        groups.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Mode for ``convolve(_:_:mode:stream:)``
-public enum ConvolveMode: Sendable {
-    case full
-    case valid
-    case same
-}
-
-/// The discrete convolution of 1D arrays.
-///
-/// - Parameters:
-///     - a: 1D input array
-///     - b: 1D input array
-///     - mode: padding mode
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:convolution>
-/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
-/// - ``conv2d(_:_:stride:padding:dilation:groups:stream:)``
-public func convolve(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, mode: ConvolveMode = .full,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-
-    precondition(a.ndim == 1, "inputs must be 1d (a)")
-    precondition(b.ndim == 1, "inputs must be 1d (b)")
-
-    var (input, weight) = a.size < b.size ? (b, a) : (a, b)
-
-    var slice = mlx_array_new()
-    mlx_slice(
-        &slice,
-        weight.ctx, [weight.dim(0) - 1].asInt32, 1, [-weight.dim(0) - 1].asInt32, 1, [-1], 1,
-        stream.ctx)
-    weight = MLXArray(slice)
-
-    weight = weight.reshaped([1, -1, 1], stream: stream)
-    input = input.reshaped([1, -1, 1], stream: stream)
-
-    let weightSize = weight.size
-    var padding = 0
-
-    switch mode {
-    case .full:
-        padding = weightSize - 1
-    case .valid:
-        padding = 0
-    case .same:
-        if weightSize % 2 == 1 {
-            padding = weightSize / 2
-        } else {
-            let padLeft = weightSize / 2
-            let padRight = max(0, padLeft / 2 - 1)
-
-            input = padded(input, widths: [0, [padLeft, padRight], 0], stream: stream)
-        }
-    }
-
-    var result = mlx_array_new()
-    mlx_conv1d(&result, input.ctx, weight.ctx, 1, padding.int32, 1, 1, stream.ctx)
-    return MLXArray(result).reshaped(-1, stream: stream)
-}
-
-/// Element-wise hyperbolic cosine.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``cos(_:stream:)``
-public func cosh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_cosh(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Convert angles from radians to degrees.
-///
-/// - Parameters:
-///   - array: input array
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``radians(_:stream:)``
-public func degrees(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_degrees(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Insert dependencies between arrays in the graph. The outputs are
-/// identical to `input` but with dependencies on `dependencies`.
-///
-/// - Parameters:
-///   - input: input array
-///   - dependencies: arrays to depend on
-/// - Returns: output which depends on the `dependencies`
-///
-/// ### See Also
-/// - ``depends(inputs:dependencies:)``
-public func depends(input: MLXArray, dependencies: [MLXArray]) -> MLXArray {
-    var result = mlx_vector_array_new()
-    defer { mlx_vector_array_free(result) }
-    let inputs = new_mlx_vector_array([input])
-    defer { mlx_vector_array_free(inputs) }
-    let dependencies = new_mlx_vector_array(dependencies)
-    defer { mlx_vector_array_free(dependencies) }
-    mlx_depends(&result, inputs, dependencies)
-
-    let arrays = mlx_vector_array_values(result)
-    return arrays[0]
-}
-
-/// Insert dependencies between arrays in the graph. The outputs are
-/// identical to `inputs` but with dependencies on `dependencies`.
-///
-/// - Parameters:
-///   - inputs: input arrays
-///   - dependencies: arrays to depend on
-/// - Returns: outputs which depends on the `dependencies`
-///
-/// ### See Also
-/// - ``depends(input:dependencies:)``
-public func depends(inputs: [MLXArray], dependencies: [MLXArray]) -> [MLXArray] {
-    var result = mlx_vector_array_new()
-    defer { mlx_vector_array_free(result) }
-    let inputs = new_mlx_vector_array(inputs)
-    defer { mlx_vector_array_free(inputs) }
-    let dependencies = new_mlx_vector_array(dependencies)
-    defer { mlx_vector_array_free(dependencies) }
-    mlx_depends(&result, inputs, dependencies)
-
-    return mlx_vector_array_values(result)
-}
-
-/// Quantization modes for weight compression in neural networks.
-///
-/// Quantization reduces the precision of model weights to decrease memory usage and
-/// potentially improve inference speed. Different modes use different strategies for
-/// mapping full-precision values to lower-precision representations.
-public enum QuantizationMode: String, Codable, Sendable {
-    /// Affine (linear) quantization with scale and bias parameters.
-    ///
-    /// This is the standard quantization approach where values are quantized using:
-    /// ```
-    /// quantized_value = round((value - bias) / scale)
-    /// dequantized_value = quantized_value * scale + bias
-    /// ```
-    ///
-    /// The `scale` and `bias` parameters are computed per group of elements (typically 32 or 64 elements)
-    /// to minimize quantization error. This mode provides good compression with reasonable accuracy preservation
-    /// for most neural network weights.
-    case affine
-
-    /// MX (Microscaling) FP4 quantization format.
-    ///
-    /// ### See Also
-    /// - https://www.opencompute.org/documents/ocp-microscaling-formats-mx-v1-0-spec-final-pdf
-    case mxfp4
-
-    /// MX (Microscaling) FP8 quantization format.
-    ///
-    /// ### See Also
-    /// - https://www.opencompute.org/documents/ocp-microscaling-formats-mx-v1-0-spec-final-pdf
-    case mxfp8
-
-    case nvfp4
-}
-
-/// Dequantize the matrix `w` using the provided `scales` and
-/// `biases` and the `group_size` and `bits` configuration.
-///
-/// For details, please see
-/// [this documentation](https://ml-explore.github.io/mlx/build/html/python/_autosummary/mlx.core.dequantize.html)
-///
-/// - Parameters:
-///   - w: The quantized weight matrix to dequantize
-///   - scales: Scaling factors used during quantization. Should have shape compatible with the quantized groups
-///   - biases: Bias values used during quantization. Should have shape compatible with the quantized groups
-///   - groupSize: The size of each quantization group. Elements are quantized in groups of this size. Default is 64
-///   - bits: The number of bits used per quantized element. Default is 4
-///   - mode: The quantization mode used. Either `.affine` for standard affine quantization or `.mxfp4` for MXFP4 format. Default is `.affine`
-///   - globalScale: The per-input float32 scale used for  ``QuantizationMode/nvfp4``
-///   - dtype: data type of the output.  If not specified it will be inferred from the scales and biases.
-///   - stream: Stream or device to evaluate on
-///
-/// ### See Also
-/// - ``quantized(_:groupSize:bits:mode:globalScale:stream:)``
-/// - ``quantizedMM(_:_:scales:biases:transpose:groupSize:bits:mode:stream:)``
-public func dequantized(
-    _ w: MLXArray,
-    scales: MLXArray, biases: MLXArray?,
-    groupSize: Int? = nil, bits: Int? = nil, mode: QuantizationMode = .affine,
-    globalScale: MLXArray? = nil,
-    dtype: DType? = nil,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    let gs = mlx_optional_int(value: Int32(groupSize ?? 0), has_value: groupSize != nil)
-    let bits = mlx_optional_int(value: Int32(bits ?? 0), has_value: bits != nil)
-    let dtype = mlx_optional_dtype(value: dtype?.cmlxDtype ?? MLX_FLOAT16, has_value: dtype != nil)
-    mlx_dequantize(
-        &result, w.ctx,
-        scales.ctx, (biases ?? .mlxNone).ctx, gs, bits, mode.rawValue,
-        (globalScale ?? .mlxNone).ctx,
-        dtype,
-        stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise division.
-///
-/// Divide two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = MLXArray([4, 5, 6])
-///
-/// let r = a / b / 7
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``divmod(_:_:stream:)``
-public func divide(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_divide(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise quotient and remainder.
-///
-/// The fuction `divmod(a, b)` is equivalent to but faster than
-/// `(a // b, a % b)`. The function uses numpy-style broadcasting
-/// semantics. Either or both input arrays can also be scalars.
-///
-/// - Parameters:
-///   - a: input array or scalar
-///   - b: input array or scalar
-///   - stream: stream or device to evaluate on
-/// - Returns: The quotient `a / b` and remainder `a % b`
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``divide(_:_:stream:)``
-/// - ``remainder(_:_:stream:)``
-public func divmod(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> (MLXArray, MLXArray) {
-    let (a, b) = toArrays(a, b)
-    var vec = mlx_vector_array_new()
-    mlx_divmod(&vec, a.ctx, b.ctx, stream.ctx)
-    defer { mlx_vector_array_free(vec) }
-    let result = mlx_vector_array_values(vec)
-    return (result[0], result[1])
-}
-
-/// Perform the Einstein summation convention on the operands.
-///
-/// - Parameters:
-///   - subscripts: Einstein summation convention equation
-///   - operands: input arrays
-///   - stream: stream or device to evaluate on
-public func einsum(_ subscripts: String, _ operands: MLXArray..., stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    einsum(subscripts, operands: operands, stream: stream)
-}
-
-/// Perform the Einstein summation convention on the operands.
-///
-/// - Parameters:
-///   - subscripts: Einstein summation convention equation
-///   - operands: input arrays
-///   - stream: stream or device to evaluate on
-public func einsum(
-    _ subscripts: String, operands: some Collection<MLXArray>, stream: StreamOrDevice = .default
-)
-    -> MLXArray
-{
-    let operands = new_mlx_vector_array(operands)
-    defer { mlx_vector_array_free(operands) }
-
-    var result = mlx_array_new()
-    mlx_einsum(&result, subscripts, operands, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise equality.
-///
-/// Equality comparison on two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = a + 1
-///
-/// if (a .== b).all().item() {
-///     ...
-/// }
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:logical>
-public func equal(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_equal(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise error function.
-///
-/// For details, please see
-/// [this documentation](https://ml-explore.github.io/mlx/build/html/python/_autosummary/mlx.core.erf.html)
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``erfInverse(_:stream:)``
-public func erf(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_erf(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise inverse of ``erf(_:stream:)``.
-///
-/// For details, please see
-/// [this documentation](https://ml-explore.github.io/mlx/build/html/python/_autosummary/mlx.core.erf.html)
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``erf(_:stream:)``
-public func erfInverse(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_erfinv(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Add a size one dimension at the given axis.
-///
-/// - Parameters:
-///     - array: input array
-///     - axes: indexes of the inserted dimensions
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:shapes>
-/// - ``expandedDimensions(_:axis:stream:)``
-public func expandedDimensions(
-    _ array: MLXArray, axes: some Collection<Int>, stream: StreamOrDevice = .default
-)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_expand_dims_axes(&result, array.ctx, axes.asInt32, axes.count, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Add a size one dimension at the given axis.
-///
-/// - Parameters:
-///     - array: input array
-///     - axis: index of the inserted dimension
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:shapes>
-/// - ``expandedDimensions(_:axes:stream:)``
-public func expandedDimensions(_ array: MLXArray, axis: Int, stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_expand_dims_axes(&result, array.ctx, [axis.int32], 1, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise exponential minus 1.
-///
-/// Computes `exp(x) - 1` with greater precision for small `x`.
-///
-/// - Parameters:
-///   - array: input array
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``exp(_:stream:)``
-public func expm1(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_expm1(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-@available(*, deprecated, renamed: "gatherMM(_:_:lhsIndices:rhsIndices:sortedIndices:stream:)")
-public func gatherMatmul(
-    _ a: MLXArray, _ b: MLXArray, lhsIndices: MLXArray? = nil, rhsIndices: MLXArray? = nil,
-    sortedIndices: Bool = false, stream: StreamOrDevice = .default
-) -> MLXArray {
-    gatherMM(
-        a, b,
-        lhsIndices: lhsIndices, rhsIndices: rhsIndices,
-        sortedIndices: sortedIndices,
-        stream: stream)
-}
-
-/// Matrix multiplication with matrix-level gather.
-///
-/// Performs a gather of the operands with the given indices followed by a
-/// (possibly batched) matrix multiplication of two arrays.  This operation
-/// is more efficient than explicitly applying a `take` followed by a
-/// `matmul`.
-///
-/// The indices `lhsIndices` and `rhsIndices` contain flat indices
-/// along the batch dimensions (i.e. all but the last two dimensions) of
-/// `a` and `b` respectively.
-///
-/// For `a` with shape `(A1, A2, ..., AS, M, K)`, `lhsIndices`
-/// contains indices from the range `[0, A1 * A2 * ... * AS)`
-///
-/// For `b` with shape `(B1, B2, ..., BS, M, K)`, `rhsIndices`
-/// contains indices from the range `[0, B1 * B2 * ... * BS)`
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``matmul(_:_:stream:)``
-public func gatherMM(
-    _ a: MLXArray, _ b: MLXArray, lhsIndices: MLXArray? = nil, rhsIndices: MLXArray? = nil,
-    sortedIndices: Bool = false, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-
-    mlx_gather_mm(
-        &result, a.ctx, b.ctx, (lhsIndices ?? .mlxNone).ctx, (rhsIndices ?? .mlxNone).ctx,
-        sortedIndices, stream.ctx)
-
-    return MLXArray(result)
-}
-
-@available(
-    *, deprecated,
-    renamed:
-        "gatherQuantizedMM(_:_:scales:biases:lhsIndices:rhsIndices:transpose:groupSize:bits:mode:sortedIndices:stream:)"
-)
-public func gatherQuantizedMatmul(
-    _ x: MLXArray, _ w: MLXArray, scales: MLXArray, biases: MLXArray?,
-    lhsIndices: MLXArray? = nil, rhsIndices: MLXArray? = nil,
-    transpose: Bool = true, groupSize: Int? = nil, bits: Int? = nil,
-    mode: QuantizationMode = .affine,
-    sortedIndices: Bool = false,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    gatherQuantizedMM(
-        x, w, scales: scales, biases: biases,
-        lhsIndices: lhsIndices, rhsIndices: rhsIndices,
-        transpose: transpose,
-        groupSize: groupSize, bits: bits, mode: mode,
-        sortedIndices: sortedIndices,
-        stream: stream)
-}
-
-/// Perform quantized matrix multiplication with matrix-level gather.
-///
-/// This operation is the quantized equivalent to ``gatherMM(_:_:lhsIndices:rhsIndices:sortedIndices:stream:)``
-///
-/// Note that `scales` and `biases` must have the same batch dimensions
-/// as `w` since they represent the same quantized matrix.
-///
-/// - Parameters:
-///   - x: The input matrix
-///   - w: The quantized weight matrix to be used in the matrix multiplication
-///   - scales: The scales to use per `groupSize` elements of `w`
-///   - biases: The biases to use per `groupSize` elements of `w`
-///   - lhsIndices: Optional indices for gathering from the left-hand side matrix
-///   - rhsIndices: Optional indices for gathering from the right-hand side matrix
-///   - transpose: Whether to transpose the weight matrix `w`. Default is `true`
-///   - groupSize: The size of the group in `w` that shares a scale and bias. Default is `64`
-///   - bits: The number of bits occupied by each element in `w`. Default is `4`
-///   - mode: The quantization mode. Default is `.affine`
-///   - sortedIndices: Whether the indices are sorted. Default is `false`
-///   - stream: Stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``quantizedMM(_:_:scales:biases:transpose:groupSize:bits:mode:stream:)``
-public func gatherQuantizedMM(
-    _ x: MLXArray, _ w: MLXArray, scales: MLXArray, biases: MLXArray?,
-    lhsIndices: MLXArray? = nil, rhsIndices: MLXArray? = nil,
-    transpose: Bool = true, groupSize: Int? = nil, bits: Int? = nil,
-    mode: QuantizationMode = .affine,
-    sortedIndices: Bool = false,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-
-    let gs = mlx_optional_int(value: Int32(groupSize ?? 0), has_value: groupSize != nil)
-    let bits = mlx_optional_int(value: Int32(bits ?? 0), has_value: bits != nil)
-
-    mlx_gather_qmm(
-        &result,
-        x.ctx, w.ctx, scales.ctx, (biases ?? .mlxNone).ctx, (lhsIndices ?? .mlxNone).ctx,
-        (rhsIndices ?? .mlxNone).ctx, transpose,
-        gs, bits, mode.rawValue, sortedIndices,
-        stream.ctx)
-
-    return MLXArray(result)
-}
-
-/// Element-wise greater than.
-///
-/// Greater than on two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = a + 1
-///
-/// if (a .> b).all().item() {
-///     ...
-/// }
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:logical>
-public func greater(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_greater(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise less greater than or equal.
-///
-/// Greater than or equal on two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = a + 1
-///
-/// if (a .>= b).all().item() {
-///     ...
-/// }
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:logical>
-public func greaterEqual(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_greater_equal(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Perform the Walsh-Hadamard transform along the final axis.
-///
-/// Supports sizes `n = m*2^k` for `m` in `(1, 12, 20, 28)` and `2^k <= 8192`
-/// for ``DType/float32`` and `2^k <= 16384` for ``DType/float16`` and ``DType/bfloat16``.
-///
-/// - Parameters:
-///   - array: input array
-///   - scale: scale the output by this factor -- default is `1.0/sqrt(array.dim(-1))`
-///   - stream: stream to evaluate on
-public func hadamardTransform(
-    _ array: MLXArray, scale: Float? = nil, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let scale = mlx_optional_float(value: scale ?? 0, has_value: scale != nil)
-    var result = mlx_array_new()
-    mlx_hadamard_transform(&result, array.ctx, scale, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Return the Hamming window.
-///
-/// The Hamming window is a taper formed by using a weighted cosine.
-///
-/// - Parameters:
-///   - m: number of points in the output window
-///   - stream: stream to evaluate on
-/// - Returns: The window, with the maximum value normalized to one (the value one appears only if
-///     the number of samples is odd).
-public func hamming(
-    _ m: Int, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_hamming(&result, Int32(m), stream.ctx)
-    return MLXArray(result)
-}
-
-/// Return the Hanning window.
-///
-/// The Hanning window is a taper formed by using a weighted cosine.
-///
-/// - Parameters:
-///   - m: number of points in the output window
-///   - stream: stream to evaluate on
-/// - Returns: The window, with the maximum value normalized to one (the value one appears only if
-///     the number of samples is odd).
-public func hanning(
-    _ m: Int, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_hanning(&result, Int32(m), stream.ctx)
-    return MLXArray(result)
-}
-
-/// Ordinary inner product of vectors for 1-D arrays, in higher dimensions a sum product over the last axes.
-///
-/// - Parameters:
-///   - a: input array
-///   - b: input array
-///   - stream: stream or device to evaluate on
-/// - Returns: inner product
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func inner(
-    _ a: MLXArray, _ b: MLXArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_inner(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Returns a boolean array where two arrays are element-wise equal within a tolerance.
-///
-/// Infinite values are considered equal if they have the same sign, NaN values are not equal unless
-/// `equalNAN` is `true`.
-///
-/// Two values are considered close if:
-///
-/// ```swift
-/// abs(a - b) <= (atol + rtol * abs(b))
-/// ```
-///
-/// Unlike ``arrayEqual(_:_:equalNAN:stream:)`` this function supports <doc:broadcasting>.
-///
-/// - Parameters:
-///   - a: input array
-///   - b: input array
-///   - rtol: relative tolerance (see discussion)
-///   - atol: absolute tolerance (see discussion)
-///   - equalNaN: if `true` treat NaN values as equal to each other
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - ``allClose(_:_:rtol:atol:equalNaN:stream:)``
-/// - ``arrayEqual(_:_:equalNAN:stream:)``
-public func isClose(
-    _ a: MLXArray, _ b: MLXArray, rtol: Double = 1e-5, atol: Double = 1e-8, equalNaN: Bool = false,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_isclose(&result, a.ctx, b.ctx, rtol, atol, equalNaN, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Return a boolean array indicating which elements are NaN.
-///
-/// - Parameters:
-///   - array: input array
-///   - stream: stream or device to evaluate on
-/// - Returns: The boolean array indicating which elements are NaN.
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func isNaN(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_isnan(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Return a boolean array indicating which elements are infinity.
-///
-/// - Parameters:
-///   - array: input array
-///   - stream: stream or device to evaluate on
-/// - Returns: The boolean array indicating which elements are infinity.
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func isInf(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_isinf(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Return a boolean array indicating which elements are finite.
-///
-/// - Parameters:
-///   - array: input array
-///   - stream: stream or device to evaluate on
-/// - Returns: The boolean array indicating which elements are infinity.
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func isFinite(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_isfinite(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Return a boolean array indicating which elements are negative infinity.
-///
-/// - Parameters:
-///   - array: input array
-///   - stream: stream or device to evaluate on
-/// - Returns: The boolean array indicating which elements are negative infinity.
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func isNegInf(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_isneginf(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Return a boolean array indicating which elements are positive infinity.
-///
-/// - Parameters:
-///   - array: input array
-///   - stream: stream or device to evaluate on
-/// - Returns: The boolean array indicating which elements are positive infinity.
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func isPosInf(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_isposinf(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise less than.
-///
-/// Less than on two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = a + 1
-///
-/// if (a .< b).all().item() {
-///     ...
-/// }
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:logical>
-public func less(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_less(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise less than or equal.
-///
-/// Less than or equal on two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = a + 1
-///
-/// if (a .<= b).all().item() {
-///     ...
-/// }
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:logical>
-public func lessEqual(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_less_equal(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise log-add-exp.
-///
-/// This is a numerically stable log-add-exp of two arrays with numpy-style
-/// broadcasting semantics. Either or both input arrays can also be scalars.
-///
-/// The computation is is a numerically stable version of `log(exp(a) + exp(b))`.
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func logAddExp(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_logaddexp(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise logical and.
-///
-/// Logical and on two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = a + 1
-///
-/// // equivalent
-/// let r = (a .< b) .&& ((a + 1) .> b)
-/// let r2 = logicalAnd((a .< b), ((a + 1) .> b))
-/// ```
-///
-/// - Parameters:
-///   - a: input array or scalar
-///   - b: input array or scalar
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - <doc:logical>
-/// - ``MLXArray/.&&(_:_:)``
-public func logicalAnd(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_logical_and(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise logical not.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = a + 1
-/// let r = !(a == b)
-/// ```
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - <doc:logical>
-public func logicalNot(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_logical_not(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise logical or.
-///
-/// Logical or on two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = a + 1
-///
-/// // equivalent
-/// let r = (a .< b) .|| ((a + 1) .> b)
-/// let r2 = logicalOr((a .< b), ((a + 1) .> b))
-/// ```
-///
-/// - Parameters:
-///   - a: input array or scalar
-///   - b: input array or scalar
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - <doc:logical>
-/// - ``MLXArray/.||(_:_:)``
-public func logicalOr(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_logical_or(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Indexing mode for ``meshGrid(_:sparse:indexing:stream:)``.
-public enum MeshGridIndexing: String, Sendable {
-    /// cartesian indexing
-    case xy
-
-    /// matrix indexing
-    case ij
-}
-
-/// Generate multidimensional coordinate grids from 1-D coordinate arrays
-///
-/// - Parameters:
-///   - arrays: input arrays
-///   - sparse: if `true` a sparse grid is returned in which each output array has a single
-///     non-zero element, otherwise a dense grid is returned.
-///   - indexing: indexing mode
-///   - stream: stream or device to evaluate on
-public func meshGrid(
-    _ arrays: some Collection<MLXArray>, sparse: Bool = false, indexing: MeshGridIndexing = .xy,
-    stream: StreamOrDevice = .default
-) -> [MLXArray] {
-    let mlxArrays = new_mlx_vector_array(arrays)
-    defer { mlx_vector_array_free(mlxArrays) }
-
-    var vec = mlx_vector_array_new()
-
-    mlx_meshgrid(&vec, mlxArrays, sparse, indexing.rawValue.cString(using: .utf8), stream.ctx)
-    defer { mlx_vector_array_free(vec) }
-
-    return mlx_vector_array_values(vec)
-}
-
-/// Element-wise maximum.
-///
-/// Take the element-wise max of two arrays with <doc:broadcasting>
-/// semantics.
-///
-/// - Parameters:
-///     - a: the first array
-///     - b: the second array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``minimum(_:_:stream:)``
-public func maximum(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_maximum(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute the median(s) over the given axis.
-///
-/// - Parameters:
-///     - a: the first array
-///     - axis: axis to reduce over
-///     - keepDims: if `true` keep reduced axis as singleton dimension
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:reduction>
-public func median(
-    _ a: MLXArray, axis: Int, keepDims: Bool = false,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_median(&result, a.ctx, [axis.int32], 1, keepDims, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute the median(s) over the given axes.
-///
-/// - Parameters:
-///     - a: the first array
-///     - axes: axes to reduce over
-///     - keepDims: if `true` keep reduced axis as singleton dimension
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:reduction>
-public func median(
-    _ a: MLXArray, axes: [Int], keepDims: Bool = false,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_median(&result, a.ctx, axes.asInt32, axes.count, keepDims, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute the median(s) over the full array.
-///
-/// - Parameters:
-///     - a: the first array
-///     - keepDims: if `true` keep reduced axis as singleton dimension
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:reduction>
-public func median(
-    _ a: MLXArray, keepDims: Bool = false,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_median(&result, a.ctx, nil, 0, keepDims, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise minimum.
-///
-/// Take the element-wise min of two arrays with <doc:broadcasting>
-/// semantics.
-///
-/// - Parameters:
-///     - a: the first array
-///     - b: the second array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``maximum(_:_:stream:)``
-public func minimum(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_minimum(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise multiplication.
-///
-/// Multiply two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = MLXArray([4, 5, 6])
-///
-/// let r = a * b * 7
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func multiply(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_multiply(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Replace NaN and Inf values with finite numbers.
-///
-/// - Parameters:
-///   - array: input array
-///   - nan: value to replace NaN with
-///   - posInf: value to replace positive inifinites with.  If not specified will use
-///     the largest finite value for the given dtype.
-///   - negInf: value to replace negative inifinites with.  If not specified will use
-///     the negative of the largest finite value for the given dtype.
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func nanToNum(
-    _ array: MLXArray,
-    nan: Float = 0, posInf: Float? = 0, negInf: Float? = 0,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    let posInf = mlx_optional_float(value: posInf ?? 0, has_value: posInf != nil)
-    let negInf = mlx_optional_float(value: negInf ?? 0, has_value: negInf != nil)
-    var result = mlx_array_new()
-    mlx_nan_to_num(&result, array.ctx, nan, posInf, negInf, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise negation.
-///
-/// Negate the values in the array.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let r = negative(a) // e.g. -a
-/// ```
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func negative(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_negative(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise not equal.
-///
-/// Not equal on two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = a + 1
-///
-/// // equivalent to if (a .!= b).all().item() {
-/// if notEqual(a, b).all().item() {
-///     ...
-/// }
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:logical>
-public func notEqual(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_not_equal(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute the outer product of two 1-D arrays, if the array's passed are not 1-D a flatten op will be run beforehand.
-///
-/// - Parameters:
-///   - a: input array
-///   - b: input array
-///   - stream: stream or device to evaluate on
-/// - Returns: outer product
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func outer(
-    _ a: MLXArray, _ b: MLXArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_outer(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Mode for ``padded(_:width:mode:value:stream:)``
-public enum PadMode: String {
-    /// pads with constant value
-    case constant
-    /// pads with the edge values of the array
-    case edge
-}
-
-/// Pad an array with a constant value.
-///
-/// - Parameters:
-///     - array: the array to pad
-///     - width: either an `Int` number of values to pad before AND after each axis or an array of 2 giving the
-///             before and after counts
-///     - mode: padding mode, see ``PadMode``
-///     - value: constant value to pad the edges with
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:shapes>
-/// - ``padded(_:widths:mode:value:stream:)``
-public func padded(
-    _ array: MLXArray, width: IntOrPair, mode: PadMode = .constant, value: MLXArray? = nil,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    let ndim = array.ndim
-    let axes = Array(Int32(0) ..< Int32(ndim))
-    let lowPads = (0 ..< ndim).map { _ in width.first.int32 }
-    let highPads = (0 ..< ndim).map { _ in width.second.int32 }
-    let value = value ?? MLXArray(0, dtype: array.dtype)
-
-    var result = mlx_array_new()
-    mlx_pad(
-        &result,
-        array.ctx, axes, ndim, lowPads, ndim, highPads, ndim, value.ctx,
-        mode.rawValue.cString(using: .utf8), stream.ctx)
-    return MLXArray(result)
-}
-
-/// Pad an array with a constant value.
-///
-/// - Parameters:
-///     - array: the array to pad
-///     - widths: array of int or pairs giving the before/after amounts for each axis
-///     - mode: padding mode, see ``PadMode``
-///     - value: constant value to pad the edges with
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:shapes>
-/// - ``padded(_:width:mode:value:stream:)``
-public func padded(
-    _ array: MLXArray, widths: some Collection<IntOrPair>, mode: PadMode = .constant,
-    value: MLXArray? = nil,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    let ndim = array.ndim
-    let axes = Array(Int32(0) ..< Int32(ndim))
-    let lowPads = widths.map { $0.first.int32 }
-    let highPads = widths.map { $0.second.int32 }
-    let value = value ?? MLXArray(0, dtype: array.dtype)
-
-    var result = mlx_array_new()
-    mlx_pad(
-        &result,
-        array.ctx, axes, ndim, lowPads, ndim, highPads, ndim, value.ctx,
-        mode.rawValue.cString(using: .utf8), stream.ctx)
-    return MLXArray(result)
-}
-
-/// Returns a partitioned copy of the array such that the smaller `kth`
-/// elements are first.
-///
-/// The ordering of the elements in partitions is undefined.
-///
-/// - Parameters:
-///     - array: input array
-///     - kth: Element at the `kth` index will be in its sorted
-///                   position in the output. All elements before the kth index will
-///                   be less or equal to the `kth` element and all elements after
-///                   will be greater or equal to the `kth` element in the output.
-///     - axis: axis to partition over
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:sorting>
-/// - ``partitioned(_:kth:stream:)``
-/// - ``argPartition(_:kth:axis:stream:)``
-public func partitioned(_ array: MLXArray, kth: Int, axis: Int, stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_partition_axis(&result, array.ctx, kth.int32, axis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-///
-/// Returns a partitioned copy of the flattened array such that the smaller `kth`
-/// elements are first.
-///
-/// The ordering of the elements in partitions is undefined.
-///
-/// - Parameters:
-///     - array: input array
-///     - kth: Element at the `kth` index will be in its sorted
-///                   position in the output. All elements before the kth index will
-///                   be less or equal to the `kth` element and all elements after
-///                   will be greater or equal to the `kth` element in the output.
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:sorting>
-/// - ``partitioned(_:kth:axis:stream:)``
-/// - ``argPartition(_:kth:axis:stream:)``
-public func partitioned(_ array: MLXArray, kth: Int, stream: StreamOrDevice = .default) -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_partition(&result, array.ctx, kth.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Put values along an axis at the specified indices.
-///
-/// - Parameters:
-///     - array: destination array
-///     - indices: Indices array. These should be broadcastable with the input array excluding the `axis` dimension.
-///     - values: Values array. These should be broadcastable with the indices.
-///     - axis: Axis in the destination to put the values to
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:indexes>
-/// - ``takeAlong(_:_:stream:)``
-public func putAlong(
-    _ array: MLXArray, _ indices: MLXArray, values: MLXArray, axis: Int,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_put_along_axis(&result, array.ctx, indices.ctx, values.ctx, axis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Put values along an axis at the specified indices in a flattened array.
-///
-/// - Parameters:
-///     - array: destination array
-///     - indices: Indices array. These should be broadcastable with the flattened input array
-///     - values: Values array. These should be broadcastable with the flattened input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:indexes>
-/// - ``takeAlong(_:_:axis:stream:)
-public func putAlong(
-    _ array: MLXArray, _ indices: MLXArray, values: MLXArray, stream: StreamOrDevice = .default
-)
-    -> MLXArray
-{
-    let input = array.reshaped([-1], stream: stream)
-    var result = mlx_array_new()
-    mlx_put_along_axis(&result, input.ctx, indices.ctx, values.ctx, 0, stream.ctx)
-    return MLXArray(result).reshaped(array.shape, stream: stream)
-}
-
-/// Quantize the matrix `w` using `bits` bits per element.
-///
-/// Note, every `group_size` elements in a row of `w` are quantized
-/// together. Hence, number of columns of `w` should be divisible by
-/// `group_size`. In particular, the rows of `w` are divided into groups of
-/// size `group_size` which are quantized together.
-///
-/// > `quantized` currently only supports 2D inputs with dimensions which are multiples of 32
-///
-/// - Parameters:
-///   - w: Matrix to be quantized
-///   - groupSize: The size of the group in `w` that shares a scale and bias. Default is `64`
-///   - bits: The number of bits occupied by each element of `w` in the returned quantized matrix. Default is `4`
-///   - mode: The quantization mode. Default is `.affine`
-///   - globalScale: The per-input float32 scale used for  ``QuantizationMode/nvfp4``
-///   - stream: Stream or device to evaluate on
-/// - Returns: A tuple containing the quantized weights (`wq`), scaling factors (`scales`), and bias values (`biases`).
-///     Note that `biases` may be nil in for some `mode`.
-///
-/// For details, please see
-/// [this documentation](https://ml-explore.github.io/mlx/build/html/python/_autosummary/mlx.core.quantize.html)
-///
-/// ### See Also
-/// - ``dequantized(_:scales:biases:groupSize:bits:mode:globalScale:dtype:stream:)``
-/// - ``quantizedMM(_:_:scales:biases:transpose:groupSize:bits:mode:stream:)``
-public func quantized(
-    _ w: MLXArray,
-    groupSize: Int? = nil, bits: Int? = nil,
-    mode: QuantizationMode = .affine,
-    globalScale: MLXArray? = nil,
-    stream: StreamOrDevice = .default
-) -> (wq: MLXArray, scales: MLXArray, biases: MLXArray?) {
-    var r = mlx_vector_array_new()
-    defer { mlx_vector_array_free(r) }
-
-    let gs = mlx_optional_int(value: Int32(groupSize ?? 0), has_value: groupSize != nil)
-    let bits = mlx_optional_int(value: Int32(bits ?? 0), has_value: bits != nil)
-
-    mlx_quantize(
-        &r, w.ctx, gs, bits, mode.rawValue,
-        (globalScale ?? .mlxNone).ctx,
-        stream.ctx)
-
-    let arrays = mlx_vector_array_values(r)
-    return (arrays[0], arrays[1], arrays.count > 2 ? arrays[2] : nil)
-}
-
-@available(
-    *, deprecated, renamed: "quantizedMM(_:_:scales:biases:transpose:groupSize:bits:mode:stream:)"
-)
-public func quantizedMatmul(
-    _ x: MLXArray, _ w: MLXArray, scales: MLXArray, biases: MLXArray?,
-    transpose: Bool = true,
-    groupSize: Int? = nil, bits: Int? = nil,
-    mode: QuantizationMode = .affine,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    quantizedMM(
-        x, w, scales: scales, biases: biases,
-        transpose: transpose,
-        groupSize: groupSize, bits: bits, mode: mode,
-        stream: stream)
-}
-
-/// Perform the matrix multiplication with the quantized matrix `w`. The
-/// quantization uses one floating point scale and bias per `group_size` of
-/// elements. Each element in `w` takes `bits` bits and is packed in an
-/// unsigned 32 bit integer.
-///
-/// - Parameters:
-///   - x: Input array
-///   - w: Quantized matrix packed in unsigned integers
-///   - scales: The scales to use per `groupSize` elements of `w`
-///   - biases: The biases to use per `groupSize` elements of `w`
-///   - transpose: Defines whether to multiply with the transposed `w` or not,
-///     namely whether we are performing `x @ w.T` or `x @ w`. Default is `true`
-///   - groupSize: The size of the group in `w` that shares a scale and bias. Default is `64`
-///   - bits: The number of bits occupied by each element in `w`. Default is `4`
-///   - mode: The quantization mode. Default is `.affine`
-///   - stream: Stream or device to evaluate on
-///
-/// ### See Also
-/// - ``dequantized(_:scales:biases:groupSize:bits:mode:globalScale:dtype:stream:)``
-/// - ``quantized(_:groupSize:bits:mode:globalScale:stream:)``
-public func quantizedMM(
-    _ x: MLXArray, _ w: MLXArray, scales: MLXArray, biases: MLXArray?,
-    transpose: Bool = true,
-    groupSize: Int? = nil, bits: Int? = nil,
-    mode: QuantizationMode = .affine,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-
-    let gs = mlx_optional_int(value: Int32(groupSize ?? 0), has_value: groupSize != nil)
-    let bits = mlx_optional_int(value: Int32(bits ?? 0), has_value: bits != nil)
-
-    mlx_quantized_matmul(
-        &result,
-        x.ctx, w.ctx, scales.ctx, (biases ?? .mlxNone).ctx,
-        transpose, gs, bits,
-        mode.rawValue,
-        stream.ctx
-    )
-    return MLXArray(result)
-}
-
-/// Perform a matrix multiplication using a possibly quantized weight matrix
-/// `w` and a non-quantized input `x`. The input `x` is quantized on the
-/// fly. The weight matrix `w` is used as-is if it is already quantized;
-/// otherwise, it is quantized on the fly.
-///
-/// If `w` is quantized, `scales` must be provided, and `groupSize`,
-/// `bits`, and `mode` must match the parameters that were used to quantize
-/// `w`.
-///
-/// Notes:
-/// - If `w` is expected to receive gradients, it must be provided in
-///   non-quantized form.
-///
-/// - If `x` and `w` are not quantized, their data types must be ``DType/float32``,
-///   ``DType/float16``, or ``DType/bfloat16``.
-///
-/// - If `w` is quantized, it must be packed in unsigned integers.
-///
-/// - Parameters:
-///   - x: input array
-///   - w: weight matrix.  If quantized, it is packed in unsigned integers.
-///   - scales: The scales to use per `groupSize` elements of `w` if `w` is quantized
-///   - groupSize: Number of elements in `x` and `w` that share a scale
-///   - bits: Number of bits used to represent each element of `x` and `w`
-///   - mode: The quantization mode. Default is `.affine`
-///   - globalScaleX: The per-input float32 scale used for `x` with  ``QuantizationMode/nvfp4``
-///   - globalScaleW: The per-input float32 scale used for  `w` with ``QuantizationMode/nvfp4``
-///   - stream: Stream or device to evaluate on
-public func quantizedQuantizedMM(
-    _ x: MLXArray, _ w: MLXArray, scales: MLXArray?,
-    groupSize: Int? = nil, bits: Int? = nil,
-    mode: QuantizationMode = .nvfp4,
-    globalScaleX: MLXArray? = nil,
-    globalScaleW: MLXArray? = nil,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-
-    let gs = mlx_optional_int(value: Int32(groupSize ?? 0), has_value: groupSize != nil)
-    let bits = mlx_optional_int(value: Int32(bits ?? 0), has_value: bits != nil)
-
-    mlx_qqmm(
-        &result,
-        x.ctx, w.ctx, (scales ?? .mlxNone).ctx,
-        gs, bits,
-        mode.rawValue,
-        (globalScaleX ?? .mlxNone).ctx,
-        (globalScaleW ?? .mlxNone).ctx,
-        stream.ctx
-    )
-    return MLXArray(result)
-}
-
-/// Convert angles from degrees to radians.
-///
-/// - Parameters:
-///   - array: input array
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``degrees(_:stream:)``
-public func radians(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_radians(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise remainder of division.
-///
-/// Computes the remainder of dividing `lhs` with `rhs` with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-///
-/// let r = remainder(a, 2) // e.g. a % 2
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func remainder(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_remainder(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Roll array elements along a given axis.
-///
-/// Elements that are rolled beyond the end of the array are introduced at the beggining and vice-versa.
-///
-/// - Parameters:
-///   - a: input array
-///   - shift: The number of places by which elements
-///     are shifted. If positive the array is rolled to the right, if
-///     negative it is rolled to the left.
-///   - axis: the axis along which to roll the elements
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:shapes>
-public func roll(_ a: MLXArray, shift: Int, axis: Int, stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_roll_axis(&result, a.ctx, [shift.int32], 1, axis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Roll array elements along a given axis.
-///
-/// Elements that are rolled beyond the end of the array are introduced at the beggining and vice-versa.
-///
-/// - Parameters:
-///   - a: input array
-///   - shift: The number of places by which elements
-///     are shifted. If positive the array is rolled to the right, if
-///     negative it is rolled to the left.
-///   - axes: the axes along which to roll the elements, or all if omitted
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:shapes>
-public func roll(
-    _ a: MLXArray, shift: Int, axes: (some Collection<Int>)? = [Int]?.none,
-    stream: StreamOrDevice = .default
-)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    if let axes {
-        mlx_roll_axes(&result, a.ctx, [shift.int32], 1, axes.asInt32, axes.count, stream.ctx)
-    } else {
-        mlx_roll(&result, a.ctx, [shift.int32], 1, stream.ctx)
-    }
-    return MLXArray(result)
-}
-
-/// Element-wise logistic sigmoid.
-///
-/// For details, please see
-/// [this documentation](https://ml-explore.github.io/mlx/build/html/python/_autosummary/mlx.core.sigmoid.html)
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func sigmoid(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_sigmoid(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise sign.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func sign(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_sign(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise hyperbolic sine.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``sin(_:stream:)``
-public func sinh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_sinh(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-@available(*, deprecated, renamed: "softmax(_:axes:precise:stream:)")
-@_documentation(visibility: internal)
-public func softMax(
-    _ array: MLXArray, axes: some Collection<Int>, precise: Bool = false,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    softmax(array, axes: axes, precise: precise, stream: stream)
-}
-
-/// Perform the softmax along the given axis.
-///
-/// This operation is a numerically stable version of:
-///
-/// ```swift
-///exp(a) / sum(exp(a), axis, keepdims: true)
-/// ```
-///
-/// - Parameters:
-///     - array: input array
-///     - axes: axes to compute the softmax over
-///     - precise: if true, compute a more precise softmax by scaling the input
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``softmax(_:axis:precise:stream:)``
-/// - ``softmax(_:precise:stream:)``
-public func softmax(
-    _ array: MLXArray, axes: some Collection<Int>, precise: Bool = false,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_softmax_axes(&result, array.ctx, axes.asInt32, axes.count, precise, stream.ctx)
-    return MLXArray(result)
-}
-
-@available(*, deprecated, renamed: "softmax(_:axis:precise:stream:)")
-@_documentation(visibility: internal)
-public func softMax(
-    _ array: MLXArray, axis: Int, precise: Bool = false, stream: StreamOrDevice = .default
-) -> MLXArray {
-    softmax(array, axis: axis, precise: precise, stream: stream)
-}
-
-/// Perform the softmax along the given axis.
-///
-/// This operation is a numerically stable version of:
-///
-/// ```swift
-///exp(a) / sum(exp(a), axis, keepdims: true)
-/// ```
-///
-/// - Parameters:
-///     - array: input array
-///     - axis: axis to compute the softmax over
-///     - precise: if true, compute a more precise softmax by scaling the input
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``softmax(_:axes:precise:stream:)``
-/// - ``softmax(_:precise:stream:)``
-public func softmax(
-    _ array: MLXArray, axis: Int, precise: Bool = false, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_softmax_axis(&result, array.ctx, axis.int32, precise, stream.ctx)
-    return MLXArray(result)
-}
-
-@available(*, deprecated, renamed: "softmax(_:axis:precise:stream:)")
-@_documentation(visibility: internal)
-public func softMax(_ array: MLXArray, precise: Bool = false, stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    softmax(array, precise: precise, stream: stream)
-}
-
-/// Perform the softmax along the given axis.
-///
-/// This operation is a numerically stable version of:
-///
-/// ```swift
-///exp(a) / sum(exp(a), axis, keepdims: true)
-/// ```
-///
-/// - Parameters:
-///     - array: input array
-///     - precise: if true, compute a more precise softmax by scaling the input
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - ``softmax(_:axes:precise:stream:)``
-/// - ``softmax(_:axis:precise:stream:)``
-public func softmax(_ array: MLXArray, precise: Bool = false, stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_softmax(&result, array.ctx, precise, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Returns a sorted copy of the array.
-///
-/// - Parameters:
-///     - array: input array
-///     - axis: axis to sort over
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:sorting>
-/// - ``sorted(_:stream:)``
-/// - ``argSort(_:axis:stream:)``
-public func sorted(_ array: MLXArray, axis: Int, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_sort_axis(&result, array.ctx, axis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Returns a sorted copy of the flattened array.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:sorting>
-/// - ``sorted(_:axis:stream:)``
-/// - ``argSort(_:axis:stream:)``
-public func sorted(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_sort(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute the standard deviation(s) over the given axes.
-///
-/// - Parameters:
-///   - array: input array
-///   - axes: axes to reduce over
-///   - keepDims: if `true` keep reduced axis as singleton dimension
-///   - ddof: the divisor to compute the varian is `N - ddof`
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:reduction>
-/// - ``std(_:axis:keepDims:ddof:stream:)``
-/// - ``std(_:keepDims:ddof:stream:)``
-public func std(
-    _ array: MLXArray, axes: some Collection<Int>, keepDims: Bool = false, ddof: Int = 0,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_std_axes(&result, array.ctx, axes.asInt32, axes.count, keepDims, ddof.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute the standard deviation over the given axis.
-///
-/// - Parameters:
-///   - array: input array
-///   - axis: axis to reduce over
-///   - keepDims: if `true` keep reduced axis as singleton dimension
-///   - ddof: the divisor to compute the varian is `N - ddof`
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:reduction>
-/// - ``std(_:axes:keepDims:ddof:stream:)``
-/// - ``std(_:keepDims:ddof:stream:)``
-public func std(
-    _ array: MLXArray, axis: Int, keepDims: Bool = false, ddof: Int = 0,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_std_axis(&result, array.ctx, axis.int32, keepDims, ddof.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute the standard deviations over all axes.
-///
-/// - Parameters:
-///   - array: input array
-///   - keepDims: if `true` keep reduced axis as singleton dimension
-///   - ddof: the divisor to compute the varian is `N - ddof`
-///   - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:reduction>
-/// - ``std(_:axes:keepDims:ddof:stream:)``
-/// - ``std(_:axis:keepDims:ddof:stream:)``
-public func std(
-    _ array: MLXArray, keepDims: Bool = false, ddof: Int = 0, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_std(&result, array.ctx, keepDims, ddof.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Stacks the arrays along a new axis.
-///
-/// ### See Also
-/// - <doc:shapes>
-public func stacked(
-    _ arrays: some Collection<MLXArray>, axis: Int = 0, stream: StreamOrDevice = .default
-)
-    -> MLXArray
-{
-    let vector_array = new_mlx_vector_array(arrays)
-    defer { mlx_vector_array_free(vector_array) }
-    var result = mlx_array_new()
-    mlx_stack_axis(&result, vector_array, axis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Stop gradients from being computed.
-///
-///The operation is the identity but it prevents gradients from flowing
-/// through the array.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-public func stopGradient(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_stop_gradient(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise subtraction.
-///
-/// Subtract two arrays with <doc:broadcasting>.
-///
-/// For example:
-///
-/// ```swift
-/// let a = MLXArray(0 ..< 12, [4, 3])
-/// let b = MLXArray([4, 5, 6])
-///
-/// let r = subtract(a, b) // e.g. a - b
-/// ```
-///
-/// - Parameters:
-///     - a: the left hand side array
-///     - b: the right hand side array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func subtract(
-    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_subtract(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Take values along an axis at the specified indices.
-///
-/// - Parameters:
-///     - array: the left hand side array
-///     - indices: should be broadcastable to `array` excluding the `axis` dimension
-///     - axis: axis in the input to take the values from
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:indexes>
-/// - ``takeAlong(_:_:stream:)``
-public func takeAlong(
-    _ array: MLXArray, _ indices: MLXArray, axis: Int, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_take_along_axis(&result, array.ctx, indices.ctx, axis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Take values along an axis at the specified indices from a flattened array.
-///
-/// - Parameters:
-///     - array: the left hand side array
-///     - indices: should be broadcastable to the flattened `array`
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:indexes>
-/// - ``takeAlong(_:_:axis:stream:)
-public func takeAlong(_ array: MLXArray, _ indices: MLXArray, stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    let array = array.reshaped([-1], stream: stream)
-    var result = mlx_array_new()
-    mlx_take_along_axis(&result, array.ctx, indices.ctx, 0, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise tangent.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func tan(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_tan(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Element-wise hyperbolic tangent.
-///
-/// - Parameters:
-///     - array: input array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func tanh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_tanh(&result, array.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute tensor dot product.
-///
-/// - Parameters:
-///   - a: input array
-///   - b: input array
-///   - axes: sum over the last `axes` dimensions
-///   - stream: stream or device to evaluate on
-/// - Returns: tensor dot product
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``tensordot(_:_:axes:stream:)-(MLXArray,MLXArray,Int,StreamOrDevice)``
-public func tensordot(
-    _ a: MLXArray, _ b: MLXArray, axes: Int = 1, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_tensordot_axis(&result, a.ctx, b.ctx, axes.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute tensor dot product.
-///
-/// - Parameters:
-///   - a: input array
-///   - b: input array
-///   - axes: two ranges for the `a` and `b` dimensions
-///   - stream: stream or device to evaluate on
-/// - Returns: tensor dot product
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``tensordot(_:_:axes:stream:)-(MLXArray,MLXArray,((Int,Int),(Int,Int)),StreamOrDevice)``
-public func tensordot(
-    _ a: MLXArray, _ b: MLXArray, axes: ((Int, Int), (Int, Int)), stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_tensordot(
-        &result,
-        a.ctx, b.ctx, [axes.0.0, axes.0.1].asInt32, 2, [axes.1.0, axes.1.1].asInt32, 2,
-        stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute tensor dot product.
-///
-/// - Parameters:
-///   - a: input array
-///   - b: input array
-///   - axes: multiple ranges for the `a` and `b` dimensions
-///   - stream: stream or device to evaluate on
-/// - Returns: tensor dot product
-///
-/// ### See Also
-/// - <doc:arithmetic>
-/// - ``tensordot(_:_:axes:stream:)``
-public func tensordot(
-    _ a: MLXArray, _ b: MLXArray, axes: (some Collection<Int>, some Collection<Int>),
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_tensordot(
-        &result,
-        a.ctx, b.ctx, axes.0.asInt32, axes.0.count, axes.1.asInt32, axes.1.count,
-        stream.ctx)
-    return MLXArray(result)
-}
-
-/// Construct array by repeating given array the number of times given by `repetitions`.
-///
-/// - Parameters:
-///   - array: input array
-///   - repetitions: number of repetitions for each axis
-///   - stream: stream or device to evaluate on
-/// - Returns: tiled array
-///
-/// ### See Also
-/// - <doc:shapes>
-/// - ``tiled(_:repetitions:stream:)-eouf``
-public func tiled(
-    _ array: MLXArray, repetitions: some Collection<Int>, stream: StreamOrDevice = .default
-)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_tile(&result, array.ctx, repetitions.asInt32, repetitions.count, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Construct array by repeating given array the number of times given by `repetitions`.
-///
-/// - Parameters:
-///   - array: input array
-///   - repetitions: number of repetitions for all axes
-///   - stream: stream or device to evaluate on
-/// - Returns: tiled array
-///
-/// ### See Also
-/// - <doc:shapes>
-/// - ``tiled(_:repetitions:stream:)-(MLXArray,Int,StreamOrDevice)``
-public func tiled(_ array: MLXArray, repetitions: Int, stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_tile(&result, array.ctx, [repetitions.int32], 1, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Returns the `k` largest elements from the input along a given axis.
-///
-/// The elements will not necessarily be in sorted order.
-///
-/// - Parameters:
-///     - array: input array
-///     - k: how many values
-///     - axis: axis to select over
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:sorting>
-/// - ``top(_:k:stream:)``
-public func top(_ array: MLXArray, k: Int, axis: Int = -1, stream: StreamOrDevice = .default)
-    -> MLXArray
-{
-    var result = mlx_array_new()
-    mlx_topk_axis(&result, array.ctx, k.int32, axis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Returns the `k` largest elements from the flattened input along a given axis.
-///
-/// The elements will not necessarily be in sorted order.
-///
-/// - Parameters:
-///     - array: input array
-///     - k: how many values
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:sorting>
-/// - ``top(_:k:axis:stream:)``
-public func top(_ array: MLXArray, k: Int, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_topk(&result, array.ctx, k.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Return the sum along a specified diagonal in the given array.
-///
-/// - Parameters:
-///   - array: input array
-///   - offset: Offset of the diagonal from the main diagonal
-///   - axis1: The first axis of the 2-D sub-arrays from which the diagonals should be taken
-///   - axis2: The second axis of the 2-D sub-arrays from which the diagonals should be taken
-///   - dtype: Data type of the output array. If unspecified the output type is inferred from the input array.
-///   - stream: stream or device to evaluate on
-/// - Returns: sum of specified diagonal.
-///
-/// ### See Also
-/// - <doc:arithmetic>
-public func trace(
-    _ array: MLXArray, offset: Int = 0, axis1: Int = 0, axis2: Int = 1, dtype: DType? = nil,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_trace(
-        &result,
-        array.ctx, offset.int32, axis1.int32, axis2.int32, (dtype ?? array.dtype).cmlxDtype,
-        stream.ctx)
-    return MLXArray(result)
-}
-
-/// Zeros the array above the given diagonal.
-///
-/// - Parameters:
-///     - array: input array
-///     - k: the diagonal of the 2-D array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - ``triu(_:k:stream:)``
-public func tril(_ array: MLXArray, k: Int = 0, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_tril(&result, array.ctx, k.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Zeros the array below the given diagonal.
-///
-/// - Parameters:
-///     - array: input array
-///     - k: the diagonal of the 2-D array
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - ``tril(_:k:stream:)``
-public func triu(_ array: MLXArray, k: Int = 0, stream: StreamOrDevice = .default) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_triu(&result, array.ctx, k.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Select from `x` or `y` according to `condition`.
-///
-/// The condition and input arrays must be the same shape or <doc:broadcasting>
-/// with each another.
-///
-/// > ``which(_:_:_:stream:)`` may be easier to use (`where` is a Swift keyword).
-///
-/// - Parameters:
-///     - condition: condition array
-///     - a: input selected from where condiiton is non-zero or `true`
-///     - b: input selected from where condiiton is zero or `false`
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:logical>
-/// - ``which(_:_:_:stream:)``
-public func `where`(
-    _ condition: MLXArray, _ a: some ScalarOrArray, _ b: some ScalarOrArray,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_where(&result, condition.ctx, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Alias for ``where(_:_:_:stream:)`` -- select from `x` or `y` according to `condition`.
-///
-/// The condition and input arrays must be the same shape or <doc:broadcasting>
-/// with each another.
-///
-/// - Parameters:
-///     - condition: condition array
-///     - a: input selected from where condiiton is non-zero or `true`
-///     - b: input selected from where condiiton is zero or `false`
-///     - stream: stream or device to evaluate on
-///
-/// ### See Also
-/// - <doc:logical>
-/// - ``where(_:_:_:stream:)``
-public func which(
-    _ condition: MLXArray, _ a: some ScalarOrArray, _ b: some ScalarOrArray,
-    stream: StreamOrDevice = .default
-) -> MLXArray {
-    let (a, b) = toArrays(a, b)
-    var result = mlx_array_new()
-    mlx_where(&result, condition.ctx, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Compute the Kronecker product of two arrays `a` and `b`.
-///
-/// - Parameters:
-///     - a: input array
-///     - b: input array
-///     - stream: stream or device to evaluate on
-public func kron(
-    _ a: MLXArray, _ b: MLXArray, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_kron(&result, a.ctx, b.ctx, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Flatten an array.
-///
-/// The axes flattened will be between `start_axis` and `end_axis`,
-/// inclusive. Negative axes are supported. After converting negative axis to
-/// positive, axes outside the valid range will be clamped to a valid value,
-/// `start_axis` to `0` and `end_axis` to `ndim - 1`.
-///
-/// - Parameters:
-///     - a: input array
-///     - startAxis: first dim to flatten
-///     - endAxis: last dim to flatten
-///     - stream: stream or device to evaluate on
-public func flatten(
-    _ a: MLXArray, startAxis: Int, endAxis: Int = -1, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_flatten(&result, a.ctx, startAxis.int32, endAxis.int32, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Unflatten an axis of an array to a shape.
-///
-/// - Parameters:
-///     - a: input array
-///     - axis: axis to unflatten
-///     - shape: shape to unflatten into
-///     - stream: stream or device to evaluate on
-public func unflatten(
-    _ a: MLXArray, axis: Int, shape: some Collection<Int>, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_unflatten(&result, a.ctx, axis.int32, shape.map { Int32($0) }, shape.count, stream.ctx)
-    return MLXArray(result)
-}
-
-/// Force an array to be row contiguous. Copy if necessary.
-///
-/// - Parameters:
-///   - a: input array
-///   - allowColMajor: consider column major as contiguous and don’t copy
-///   - stream: stream or device to evaluate on
-/// - Returns: the row or col contiguous output.
-public func contiguous(
-    _ a: MLXArray, allowColMajor: Bool = false, stream: StreamOrDevice = .default
-) -> MLXArray {
-    var result = mlx_array_new()
-    mlx_contiguous(&result, a.ctx, allowColMajor, stream.ctx)
-    return MLXArray(result)
-}
+}
\ No newline at end of file

From de7d7390195c171f20f98e09bda391843960e8ee Mon Sep 17 00:00:00 2001
From: VDurocher <84510889+VDurocher@users.noreply.github.com>
Date: Tue, 7 Apr 2026 15:05:46 +0200
Subject: [PATCH 2/3] refactor: update Quantized.swift to use algebraic
 QuantizationMode

Update all default parameter values from .affine to .affine() to match
the new algebraic QuantizationMode enum where affine carries associated
values (groupSize and bits).
---
 Source/MLXNN/Quantized.swift | 30 +++++++++++++++---------------
 1 file changed, 15 insertions(+), 15 deletions(-)

diff --git a/Source/MLXNN/Quantized.swift b/Source/MLXNN/Quantized.swift
index 076e91ca..908764a3 100644
--- a/Source/MLXNN/Quantized.swift
+++ b/Source/MLXNN/Quantized.swift
@@ -16,7 +16,7 @@ public protocol Quantizable {
 
 extension Quantizable {
     public func toQuantized(groupSize: Int, bits: Int) -> Module {
-        toQuantized(groupSize: groupSize, bits: bits, mode: .affine)
+        toQuantized(groupSize: groupSize, bits: bits, mode: .affine())
     }
 }
 
@@ -29,10 +29,10 @@ public protocol Quantized: Module {
 
 /// Quantize any ``Quantizable`` layer that is not already quantized.
 public func quantizeSingle(
-    layer: Module, groupSize: Int = 64, bits: Int = 4, mode: QuantizationMode = .affine
+    layer: Module, groupSize: Int = 64, bits: Int = 4, mode: QuantizationMode = .affine()
 ) -> Quantized? {
     if layer is Quantized {
-        // already quantized
+        // Already quantized — do not process it again
         nil
     } else if let quantizable = layer as? Quantizable {
         quantizable.toQuantized(groupSize: groupSize, bits: bits, mode: mode) as? Quantized
@@ -56,7 +56,7 @@ public func quantizeSingle(
 /// - ``quantize(model:filter:apply:)-(_,_,(Module,Int,Int,QuantizationMode)->Module?)``
 public func quantize(
     model: Module,
-    groupSize: Int = 64, bits: Int = 4, mode: QuantizationMode = .affine,
+    groupSize: Int = 64, bits: Int = 4, mode: QuantizationMode = .affine(),
     filter: (String, Module) -> Bool = { _, _ in true },
     apply: (Module, Int, Int, QuantizationMode) -> Module? = quantizeSingle(
         layer:groupSize:bits:mode:)
@@ -84,11 +84,11 @@ public func quantize(
     model: Module, groupSize: Int = 64, bits: Int = 4,
     filter: (String, Module) -> Bool = { _, _ in true },
     apply: (Module, Int, Int) -> Module? = {
-        quantizeSingle(layer: $0, groupSize: $1, bits: $2, mode: .affine)
+        quantizeSingle(layer: $0, groupSize: $1, bits: $2, mode: .affine())
     }
 ) {
     quantize(
-        model: model, groupSize: groupSize, bits: bits, mode: .affine, filter: filter,
+        model: model, groupSize: groupSize, bits: bits, mode: .affine(), filter: filter,
         apply: { l, g, b, n in apply(l, g, b) }
     )
 }
@@ -132,14 +132,14 @@ public func quantize(
     model: Module,
     filter: (String, Module) -> (groupSize: Int, bits: Int)?,
     apply: (Module, Int, Int) -> Module? = {
-        quantizeSingle(layer: $0, groupSize: $1, bits: $2, mode: .affine)
+        quantizeSingle(layer: $0, groupSize: $1, bits: $2, mode: .affine())
     }
 ) {
     quantize(
         model: model,
         filter: {
             if let (g, b) = filter($0, $1) {
-                return (g, b, .affine)
+                return (g, b, .affine())
             } else {
                 return nil
             }
@@ -167,7 +167,7 @@ open class QuantizedEmbedding: Embedding, Quantized {
 
     convenience public init(
         embeddingCount: Int, dimensions: Int, groupSize: Int = 64, bits: Int = 4,
-        mode: QuantizationMode = .affine
+        mode: QuantizationMode = .affine()
     ) {
         let scale = sqrt(1 / Float(dimensions))
         let weight = MLXRandom.normal([embeddingCount, dimensions]) * scale
@@ -177,14 +177,14 @@ open class QuantizedEmbedding: Embedding, Quantized {
 
     public convenience init(
         _ other: Embedding, groupSize: Int = 64, bits: Int = 4,
-        mode: QuantizationMode = .affine
+        mode: QuantizationMode = .affine()
     ) {
         self.init(weight: other.weight, groupSize: groupSize, bits: bits, mode: mode)
     }
 
     public init(
         weight: MLXArray, groupSize: Int = 64, bits: Int = 4,
-        mode: QuantizationMode = .affine
+        mode: QuantizationMode = .affine()
     ) {
         self.groupSize = groupSize
         self.bits = bits
@@ -263,7 +263,7 @@ open class QuantizedLinear: Linear, Quantized {
     public convenience init(
         _ inputDimensions: Int, _ outputDimensions: Int,
         bias: Bool = true, groupSize: Int = 64, bits: Int = 4,
-        mode: QuantizationMode = .affine
+        mode: QuantizationMode = .affine()
     ) {
         let scale = sqrt(1 / Float(inputDimensions))
         let weight = MLXRandom.uniform(
@@ -283,7 +283,7 @@ open class QuantizedLinear: Linear, Quantized {
     ///   - mode: quantization mode
     public convenience init(
         _ other: Linear, groupSize: Int = 64, bits: Int = 4,
-        mode: QuantizationMode = .affine
+        mode: QuantizationMode = .affine()
     ) {
         self.init(
             weight: other.weight, bias: other.bias, groupSize: groupSize, bits: bits, mode: mode)
@@ -292,7 +292,7 @@ open class QuantizedLinear: Linear, Quantized {
     /// Initialize a ``QuantizedLinear`` with non-quantized weights and bias.
     public init(
         weight: MLXArray, bias: MLXArray?, groupSize: Int = 64, bits: Int = 4,
-        mode: QuantizationMode = .affine
+        mode: QuantizationMode = .affine()
     ) {
         self.groupSize = groupSize
         self.bits = bits
@@ -316,7 +316,7 @@ open class QuantizedLinear: Linear, Quantized {
     public init(
         weight: MLXArray, bias: MLXArray? = nil, scales: MLXArray, biases: MLXArray?,
         groupSize: Int, bits: Int,
-        mode: QuantizationMode = .affine
+        mode: QuantizationMode = .affine()
     ) {
         self.groupSize = groupSize
         self.bits = bits

From d0fdafa50c83eb190941cb224f87ab640c9fe6d0 Mon Sep 17 00:00:00 2001
From: VDurocher <84510889+VDurocher@users.noreply.github.com>
Date: Tue, 7 Apr 2026 15:07:24 +0200
Subject: [PATCH 3/3] refactor: make QuantizationMode an algebraic enum with
 associated values

- Convert QuantizationMode from String raw value enum to algebraic enum
- Add case affine(groupSize: Int = 64, bits: Int = 4) with associated values
- Keep mxfp4, mxfp8, nvfp4 as simple cases with fixed parameters
- Add cName computed property to replace rawValue for C API calls
- Add groupSize and bits computed properties on QuantizationMode
- Add manual Codable conformance (associated values prevent String raw type)
- Add Equatable conformance (auto-synthesized by Swift)
- Update all call sites: mode.rawValue -> mode.cName
- Update all default parameter values: .affine -> .affine()

Closes #285
---
 Source/MLX/Ops.swift | 3365 +++++++++++++++++++++++++++++++++++++++++-
 1 file changed, 3364 insertions(+), 1 deletion(-)

diff --git a/Source/MLX/Ops.swift b/Source/MLX/Ops.swift
index 65d4e73c..871ed948 100644
--- a/Source/MLX/Ops.swift
+++ b/Source/MLX/Ops.swift
@@ -15,4 +15,3367 @@ func broadcast(arrays: some Collection<MLXArray>, stream: StreamOrDevice = .defa
     defer { mlx_vector_array_free(result) }
 
     return mlx_vector_array_values(result)
-}
\ No newline at end of file
+}
+
+/// Element-wise addition.
+///
+/// Add two arrays with <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = MLXArray([4, 5, 6])
+///
+/// // equivalent to a + b + 7
+/// let r = add(add(a, b), 7)
+/// ```
+///
+/// - Parameters:
+///     - a: the left hand side array
+///     - b: the right hand side array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``MLXArray/+(_:_:)-(MLXArray,MLXArray)``
+public func add(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (a, b) = toArrays(a, b)
+    var result = mlx_array_new()
+    mlx_add(&result, a.ctx, b.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+@available(*, deprecated, renamed: "addMM(_:_:_:alpha:beta:stream:)")
+@_documentation(visibility: internal)
+public func addmm<A: ScalarOrArray, B: ScalarOrArray, C: ScalarOrArray>(
+    _ c: C, _ a: A, _ b: B, alpha: Float = 1.0, beta: Float = 1.0, stream: StreamOrDevice = .default
+) -> MLXArray {
+    addMM(c, a, b, alpha: alpha, beta: beta, stream: stream)
+}
+
+/// Matrix multiplication with addition and optional scaling.
+///
+/// Perform the (possibly batched) matrix multiplication of two arrays and add to the result
+/// with optional scaling factors.
+///
+/// Equivalent to:
+///
+/// ```swift
+/// alpha * matmul(a, b) + beta * c
+/// ```
+///
+/// > Note the ordering of the parameters
+///
+/// - Parameters:
+///   - c: input array or scalar
+///   - a: input array or scalar
+///   - b: input array or scalar
+///   - alpha: optional scaling for the matrix product of `a` and `b`
+///   - beta: optional scaling factor for `c`
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - ``matmul(_:_:stream:)``
+/// - ``blockMaskedMM(_:_:blockSize:maskOut:maskLHS:maskRHS:stream:)``
+public func addMM(
+    _ c: some ScalarOrArray, _ a: some ScalarOrArray, _ b: some ScalarOrArray, alpha: Float = 1.0,
+    beta: Float = 1.0, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (a, b) = toArrays(a, b)
+    let (_, c) = toArrays(a, c)
+    var result = mlx_array_new()
+    mlx_addmm(&result, c.ctx, a.ctx, b.ctx, alpha, beta, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Element-wise inverse cosine.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``cos(_:stream:)``
+public func acos(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_arccos(&result, array.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Element-wise inverse hyperbolic cosine.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``cosh(_:stream:)``
+public func acosh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_arccosh(&result, array.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Element-wise inverse sine.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``sin(_:stream:)``
+public func asin(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_arcsin(&result, array.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Element-wise inverse hyperbolic sine.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``sinh(_:stream:)``
+public func asinh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_arcsinh(&result, array.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Element-wise inverse tangent.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``tan(_:stream:)``
+public func atan(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_arctan(&result, array.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Element-wise inverse tangent of the ratio of two arrays.
+///
+/// - Parameters:
+///   - a: first input array
+///   - b: second input array
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``atan(_:stream:)``
+public func atan2(_ a: MLXArray, _ b: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_arctan2(&result, a.ctx, b.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Element-wise inverse hyperbolic tangent.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``tanh(_:stream:)``
+public func atanh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_arctanh(&result, array.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Convert array to have at least 1 dimension.
+///
+/// ### See Also
+/// - <doc:shapes>
+public func atLeast1D(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_atleast_1d(&result, array.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Convert array to have at least 2 dimensions.
+///
+/// ### See Also
+/// - <doc:shapes>
+public func atLeast2D(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_atleast_2d(&result, array.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Convert array to have at least 3 dimensions.
+///
+/// ### See Also
+/// - <doc:shapes>
+public func atLeast3D(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_atleast_3d(&result, array.ctx, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Returns the indices that partition the array.
+///
+/// The ordering of the elements within a partition given by the indices is undefined.
+///
+/// For example:
+///
+/// ```swift
+/// // array with values in random order
+/// let array = MLXRandom.randInt(0 ..< 100, [10])
+///
+/// let partitionIndexes = argPartition(array, kth: 3)
+///
+/// // the partitioned array.  the pivot is at partitioned[3] and all values
+/// // with lower indexes will be less than (in undefined order)
+/// let partitioned = array[partitionIndexes]
+/// ```
+///
+/// - Parameters:
+///     - array: input array
+///     - kth: element index at the `kth` position in the output will give the sorted position.  All indices before the `kth` position will be of elements less than or equal to the element at the `kth` index and all indices after will be elements greater than or equal to the element at the `kth` position.
+///     - axis: axis to partition over
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:indexes>
+/// - ``argPartition(_:kth:stream:)``
+/// - ``partitioned(_:kth:axis:stream:)``
+public func argPartition(_ array: MLXArray, kth: Int, axis: Int, stream: StreamOrDevice = .default)
+    -> MLXArray
+{
+    var result = mlx_array_new()
+    mlx_argpartition_axis(&result, array.ctx, kth.int32, axis.int32, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Returns the indices that partition the flattened array.
+///
+/// The ordering of the elements within a partition given by the indices is undefined.
+///
+/// - Parameters:
+///     - array: input array
+///     - kth: element index at the `kth` position in the output will give the sorted position.  All indices before the `kth` position will be of elements less than or equal to the element at the `kth` index and all indices after will be elements greater than or equal to the element at the `kth` position.
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:indexes>
+/// - ``argPartition(_:kth:axis:stream:)``
+/// - ``partitioned(_:kth:axis:stream:)``
+public func argPartition(_ array: MLXArray, kth: Int, stream: StreamOrDevice = .default) -> MLXArray
+{
+    var result = mlx_array_new()
+    mlx_argpartition(&result, array.ctx, kth.int32, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Returns the indices that sort the array.
+///
+/// ```swift
+/// // array with values in random order
+/// let array = MLXRandom.randInt(0 ..< 100, [10])
+///
+/// let sortIndexes = argSort(array, axis: -1)
+///
+/// // the array in sorted order
+/// let sorted = array[sortIndexes]
+/// ```
+///
+/// - Parameters:
+///     - array: input array
+///     - axis: axis to sort over
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:indexes>
+/// - ``argSort(_:stream:)``
+public func argSort(_ array: MLXArray, axis: Int, stream: StreamOrDevice = .default) -> MLXArray {
+    var result = mlx_array_new()
+    mlx_argsort_axis(&result, array.ctx, axis.int32, stream.ctx)
+    return MLXArray(result)
+}
+
+/// Returns the indices that sort the array.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:indexes>
+/// - ``argSort(_:axis:stream:)``
+public func argSort(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var sortOrder = mlx_array_new()
+    mlx_argsort(&sortOrder, array.ctx, stream.ctx)
+    return MLXArray(sortOrder)
+}
+
+/// Create a view into the array with the given shape and strides.
+///
+/// The resulting array will always be as if the provided array was row
+/// contiguous regardless of the provided array's storage order and current strides.
+///
+/// > Note: This function should be used with caution as it changes
+/// the shape and strides of the array directly. This can lead to the
+/// resulting array pointing to invalid memory locations which can
+/// result in crashes.
+///
+/// Here are two examples of use:
+///
+/// ```swift
+/// // strides in the reverse order is a transpose
+/// let a = MLXArray(0 ..< 12, [4, 3])
+///
+/// let transposed = asStrided(a, [3, 4], strides: [1, 3])
+/// ```
+///
+/// and:
+///
+/// ```swift
+/// // negative strides and an offset produce a reversed array
+/// let a = MLXArray(0 ..< 16, [4, 4])
+///
+/// let b = asStrided(a, [4, 4], strides: [-4, -1], offset: 15)
+/// let same = MLXArray((0 ..< 16).reversed(), [4, 4])
+/// ```
+///
+/// - Parameters:
+///     - array: input array
+///     - shape: The shape of the resulting array. If not specified it defaults to `array.shape`
+///     - strides: The strides of the resulting array. If not specified it defaults to the reverse
+///                exclusive cumulative product of `array.shape`
+///     - offset: Skip that many elements from the beginning of the input array
+///     - stream: stream or device to evaluate on
+///
+/// - Returns: The output array which is the strided view of the input
+///
+/// ### See Also
+/// - <doc:shapes>
+public func asStrided(
+    _ array: MLXArray, _ shape: (some Collection<Int>)? = [Int]?.none,
+    strides: (some Collection<Int>)? = [Int]?.none, offset: Int = 0,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    let targetShape = shape.map { Array($0) } ?? array.shape
+
+    var elementStrides: [Int64]
+    if let strides {
+        elementStrides = strides.map { Int64($0) }
+    } else {
+        // row-contiguous default: each stride is the product of the dimensions after it
+        var running = 1
+        elementStrides = targetShape.reversed().map { dim in
+            defer { running *= dim }
+            return Int64(running)
+        }
+        elementStrides.reverse()
+    }
+
+    var view = mlx_array_new()
+    mlx_as_strided(
+        &view,
+        array.ctx, targetShape.asInt32, targetShape.count, elementStrides, elementStrides.count,
+        offset,
+        stream.ctx)
+    return MLXArray(view)
+}
+
+/// Return the Bartlett window.
+///
+/// The Bartlett window is a triangular taper whose end points are zero.
+///
+/// - Parameters:
+///   - m: number of points in the output window
+///   - stream: stream to evaluate on
+/// - Returns: The window, with the maximum value normalized to one (the value one appears only if
+///     the number of samples is odd).
+public func bartlett(
+    _ m: Int, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var window = mlx_array_new()
+    mlx_bartlett(&window, Int32(m), stream.ctx)
+    return MLXArray(window)
+}
+
+/// Return the Blackman window.
+///
+/// The Blackman window is a taper formed by using the first three terms of a summation of cosines.
+///
+/// - Parameters:
+///   - m: number of points in the output window
+///   - stream: stream to evaluate on
+/// - Returns: The window, with the maximum value normalized to one (the value one appears only if
+///     the number of samples is odd).
+public func blackman(
+    _ m: Int, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var window = mlx_array_new()
+    mlx_blackman(&window, Int32(m), stream.ctx)
+    return MLXArray(window)
+}
+
+/// Matrix multiplication with block masking.
+///
+/// Perform the (possibly batched) matrix multiplication of two arrays and with blocks
+/// of size `blockSize x blockSize` optionally masked out.
+///
+/// Assuming `a` with shape (..., `M`, `K`) and b with shape (..., `K`, `N`)
+///
+/// * `maskLHS` must have shape (..., ceil(`M` / `blockSize`), ceil(`K` / `blockSize`))
+///
+/// * `maskRHS` must have shape (..., ceil(`K` / `blockSize`), ceil(`N` / `blockSize`))
+///
+/// * `maskOut` must have shape (..., ceil(`M` / `blockSize`), ceil(`N` / `blockSize`))
+///
+/// > Note: Only `block_size=64` and `block_size=32` are currently supported
+///
+/// - Parameters:
+///   - a: input array
+///   - b: input array
+///   - blockSize: Size of blocks to be masked. Must be `32` or `64`
+///   - maskOut: Boolean mask for output
+///   - maskLHS: Boolean mask for a
+///   - maskRHS: Boolean mask for b
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``multiply(_:_:stream:)``
+/// - ``addMM(_:_:_:alpha:beta:stream:)``
+/// - ``MLXArray/matmul(_:stream:)``
+/// - ``matmul(_:_:stream:)``
+public func blockMaskedMM(
+    _ a: MLXArray, _ b: MLXArray, blockSize: Int = 64, maskOut: MLXArray? = nil,
+    maskLHS: MLXArray? = nil, maskRHS: MLXArray? = nil, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var product = mlx_array_new()
+
+    mlx_block_masked_mm(
+        &product, a.ctx, b.ctx, blockSize.int32,
+        (maskOut ?? .mlxNone).ctx, (maskLHS ?? .mlxNone).ctx, (maskRHS ?? .mlxNone).ctx,
+        stream.ctx)
+
+    return MLXArray(product)
+}
+
+/// Broadcast an array to the given shape.
+///
+/// - Parameters:
+///     - array: input array
+///     - shape: shape to broadcast to
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:broadcasting>
+public func broadcast(
+    _ array: MLXArray, to shape: some Collection<Int>, stream: StreamOrDevice = .default
+) -> MLXArray {
+    // the C call receives the target shape as converted Int32 values plus their count
+    let targetDims = shape.asInt32
+    var expanded = mlx_array_new()
+    mlx_broadcast_to(&expanded, array.ctx, targetDims, shape.count, stream.ctx)
+    return MLXArray(expanded)
+}
+
+/// Element-wise ceil.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``floor(_:stream:)``
+public func ceil(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var rounded = mlx_array_new()
+    mlx_ceil(&rounded, array.ctx, stream.ctx)
+    return MLXArray(rounded)
+}
+
+/// Clip the values of the array so that none is below the given minimum.
+///
+/// - Parameters:
+///     - array: input array
+///     - min: minimum value (must broadcast to `array`)
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``clip(_:max:stream:)``
+/// - ``clip(_:min:max:stream:)``
+public func clip(
+    _ array: MLXArray, min: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (values, lowerBound) = toArrays(array, min)
+    var clipped = mlx_array_new()
+    let noUpperBound = mlx_array_new()
+    defer { mlx_array_free(noUpperBound) }
+    mlx_clip(&clipped, values.ctx, lowerBound.ctx, noUpperBound, stream.ctx)
+    return MLXArray(clipped)
+}
+
+/// Clip the values of the array between the given minimum and maximum.
+///
+/// - Parameters:
+///     - array: input array
+///     - min: minimum value (must broadcast to `array`)
+///     - max: maximum value (must broadcast to `array`)
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``clip(_:max:stream:)``
+public func clip(
+    _ array: MLXArray, min: some ScalarOrArray, max: some ScalarOrArray,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (values, lowerBound) = toArrays(array, min)
+    let upperBound = toArrays(values, max).1
+    var clipped = mlx_array_new()
+    mlx_clip(&clipped, values.ctx, lowerBound.ctx, upperBound.ctx, stream.ctx)
+    return MLXArray(clipped)
+}
+
+/// Clip the values of the array up to the given maximum.
+///
+/// - Parameters:
+///     - array: input array
+///     - max: maximum value (must broadcast to `array`)
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``clip(_:min:stream:)``
+/// - ``clip(_:min:max:stream:)``
+public func clip(_ array: MLXArray, max: some ScalarOrArray, stream: StreamOrDevice = .default)
+    -> MLXArray
+{
+    let (values, upperBound) = toArrays(array, max)
+    var clipped = mlx_array_new()
+    let noLowerBound = mlx_array_new()
+    defer { mlx_array_free(noLowerBound) }
+    mlx_clip(&clipped, values.ctx, noLowerBound, upperBound.ctx, stream.ctx)
+    return MLXArray(clipped)
+}
+
+/// Concatenate the arrays along the given axis.
+///
+/// - Parameters:
+///     - arrays: input arrays to concatenate
+///     - axis: the axis along which to concatenate
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:shapes>
+public func concatenated(
+    _ arrays: some Collection<MLXArray>, axis: Int = 0, stream: StreamOrDevice = .default
+) -> MLXArray {
+    // temporary C vector holding the inputs; released when the function exits
+    let inputs = new_mlx_vector_array(arrays)
+    defer { mlx_vector_array_free(inputs) }
+
+    var joined = mlx_array_new()
+    mlx_concatenate_axis(&joined, inputs, axis.int32, stream.ctx)
+
+    return MLXArray(joined)
+}
+
+/// 1D convolution over an input with several channels.
+///
+/// > Only the default `groups=1` is currently supported.
+///
+/// - Parameters:
+///     - array: input array of shape `[N, H, C_in]`
+///     - weight: weight array of shape `[C_out, H, C_in]`
+///     - stride: kernel stride
+///     - padding: input padding
+///     - dilation: kernel dilation
+///     - groups: input feature groups
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:convolution>
+/// - ``conv2d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``conv3d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``convolve(_:_:mode:stream:)``
+public func conv1d(
+    _ array: MLXArray, _ weight: MLXArray, stride: Int = 1, padding: Int = 0, dilation: Int = 1,
+    groups: Int = 1, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_conv1d(
+        &output, array.ctx, weight.ctx,
+        stride.int32, padding.int32, dilation.int32, groups.int32,
+        stream.ctx)
+    return MLXArray(output)
+}
+
+/// 2D convolution over an input with several channels.
+///
+/// > Only the default `groups=1` is currently supported.
+///
+/// The numeric parameters may be given as single values:
+///
+/// ```swift
+/// padding: 1
+/// ```
+///
+/// This will produce a padding of `(1, 1)`.  You can also give an array:
+///
+/// ```swift
+/// padding: [2, 3]
+/// ```
+///
+/// See ``IntOrPair`` for more information.
+///
+/// - Parameters:
+///     - array: input array of shape `[N, H, W, C_in]`
+///     - weight: weight array of shape `[C_out, H, W, C_in]`
+///     - stride: kernel stride
+///     - padding: input padding
+///     - dilation: kernel dilation
+///     - groups: input feature groups
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:convolution>
+/// - ``IntOrPair``
+/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``conv3d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``convolve(_:_:mode:stream:)``
+/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,IntOrArray,IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
+public func conv2d(
+    _ array: MLXArray, _ weight: MLXArray, stride: IntOrPair = 1, padding: IntOrPair = 0,
+    dilation: IntOrPair = 1, groups: Int = 1, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_conv2d(
+        &output, array.ctx, weight.ctx,
+        stride.first.int32, stride.second.int32,
+        padding.first.int32, padding.second.int32,
+        dilation.first.int32, dilation.second.int32, groups.int32, stream.ctx)
+    return MLXArray(output)
+}
+
+/// 3D convolution over an input with several channels.
+///
+/// > Only the default `groups=1` is currently supported.
+///
+/// The numeric parameters may be given as single values:
+///
+/// ```swift
+/// padding: 1
+/// ```
+///
+/// This will produce a padding of `(1, 1, 1)`.  You can also give an array:
+///
+/// ```swift
+/// padding: [2, 3, 3]
+/// ```
+///
+/// See ``IntOrTriple`` for more information.
+///
+/// - Parameters:
+///     - array: input array of shape `[N, D, H, W, C_in]`
+///     - weight: weight array of shape `[C_out, D, H, W, C_in]`
+///     - stride: kernel stride
+///     - padding: input padding
+///     - dilation: kernel dilation
+///     - groups: input feature groups
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:convolution>
+/// - ``IntOrTriple``
+/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``conv2d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``convolve(_:_:mode:stream:)``
+/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,IntOrArray,IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
+public func conv3d(
+    _ array: MLXArray, _ weight: MLXArray, stride: IntOrTriple = 1, padding: IntOrTriple = 0,
+    dilation: IntOrTriple = 1, groups: Int = 1, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_conv3d(
+        &output, array.ctx, weight.ctx,
+        stride.first.int32, stride.second.int32, stride.third.int32,
+        padding.first.int32, padding.second.int32, padding.third.int32,
+        dilation.first.int32, dilation.second.int32, dilation.third.int32,
+        groups.int32,
+        stream.ctx)
+    return MLXArray(output)
+}
+
+/// General convolution over an input with several channels.
+///
+/// > Only 1d and 2d convolutions are supported at the moment
+///
+/// > Only the default `groups: 1` is currently supported
+///
+/// - Parameters:
+///   - array: Input array of shape `(N, ..., C_in)`
+///   - weight: Weight array of shape `(C_out, ..., C_in)`
+///   - strides: `Int` or `some Collection<Int>` with kernel strides.  All dimensions get the
+///   same stride if only one number is specified.
+///   - padding: `Int` or `some Collection<Int>` with input padding.  All dimensions get the
+///   same padding if only one number is specified.
+///   - kernelDilation: `Int` or `some Collection<Int>` with kernel dilation.  All dimensions get the
+///   same dilation if only one number is specified.
+///   - inputDilation: `Int` or `some Collection<Int>` with input dilation.  All dimensions get the
+///   same dilation if only one number is specified.
+///   - groups: input feature groups
+///   - flip: Flip the order in which the spatial dimensions of the weights are processed.
+///   Performs the cross-correlation operator when `flip` is `false` and the convolution
+///   operator otherwise.
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:convolution>
+/// - ``IntOrArray``
+/// - ``conv2d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,(Int,Int),IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
+public func convGeneral(
+    _ array: MLXArray, _ weight: MLXArray, strides: IntOrArray = 1, padding: IntOrArray = 0,
+    kernelDilation: IntOrArray = 1, inputDilation: IntOrArray = 1, groups: Int = 1,
+    flip: Bool = false,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_conv_general(
+        &output, array.ctx, weight.ctx,
+        strides.asInt32Array, strides.count,
+        // padding is passed twice (presumably the low and high side) with equal values
+        padding.asInt32Array, padding.count,
+        padding.asInt32Array, padding.count,
+        kernelDilation.asInt32Array, kernelDilation.count,
+        inputDilation.asInt32Array, inputDilation.count,
+        groups.int32, flip, stream.ctx)
+    return MLXArray(output)
+}
+
+/// General convolution over an input with several channels with a padding pair.
+///
+/// > Only 1d and 2d convolutions are supported at the moment
+///
+/// > Only the default `groups: 1` is currently supported
+///
+/// - Parameters:
+///   - array: Input array of shape `(N, ..., C_in)`
+///   - weight: Weight array of shape `(C_out, ..., C_in)`
+///   - strides: `Int` or `some Collection<Int>` with kernel strides.  All dimensions get the
+///   same stride if only one number is specified.
+///   - padding: pair of padding values to apply to all dimensions
+///   - kernelDilation: `Int` or `some Collection<Int>` with kernel dilation.  All dimensions get the
+///   same dilation if only one number is specified.
+///   - inputDilation: `Int` or `some Collection<Int>` with input dilation.  All dimensions get the
+///   same dilation if only one number is specified.
+///   - groups: input feature groups
+///   - flip: Flip the order in which the spatial dimensions of the weights are processed.
+///   Performs the cross-correlation operator when `flip` is `false` and the convolution
+///   operator otherwise.
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:convolution>
+/// - ``IntOrArray``
+/// - ``conv2d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,IntOrArray,IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
+public func convGeneral(
+    _ array: MLXArray, _ weight: MLXArray, strides: IntOrArray = 1, padding: (Int, Int),
+    kernelDilation: IntOrArray = 1, inputDilation: IntOrArray = 1, groups: Int = 1,
+    flip: Bool = false,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_conv_general(
+        &output, array.ctx, weight.ctx,
+        strides.asInt32Array, strides.count,
+        // each half of the pair is sent as its own single-element padding list
+        [padding.0.int32], 1,
+        [padding.1.int32], 1,
+        kernelDilation.asInt32Array, kernelDilation.count,
+        inputDilation.asInt32Array, inputDilation.count,
+        groups.int32, flip, stream.ctx)
+    return MLXArray(output)
+}
+
+/// 1D transposed convolution over an input with several channels.
+///
+/// > Only the default `groups=1` is currently supported.
+///
+/// - Parameters:
+///     - array: input array of shape `[N, H, C_in]`
+///     - weight: weight array of shape `[C_out, H, C_in]`
+///     - stride: kernel stride
+///     - padding: input padding
+///     - dilation: kernel dilation
+///     - outputPadding: output padding
+///     - groups: input feature groups
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:convolution>
+/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``convTransposed2d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
+/// - ``convTransposed3d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
+/// - ``convolve(_:_:mode:stream:)``
+public func convTransposed1d(
+    _ array: MLXArray, _ weight: MLXArray, stride: Int = 1, padding: Int = 0,
+    dilation: Int = 1, outputPadding: Int = 0, groups: Int = 1,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_conv_transpose1d(
+        &output, array.ctx, weight.ctx,
+        stride.int32, padding.int32, dilation.int32,
+        outputPadding.int32, groups.int32,
+        stream.ctx)
+    return MLXArray(output)
+}
+
+/// 2D transposed convolution over an input with several channels.
+///
+/// > Only the default `groups=1` is currently supported.
+///
+/// The numeric parameters may be given as single values:
+///
+/// ```swift
+/// padding: 1
+/// ```
+///
+/// This will produce a padding of `(1, 1)`.  You can also give an array:
+///
+/// ```swift
+/// padding: [2, 3]
+/// ```
+///
+/// See ``IntOrPair`` for more information.
+///
+/// - Parameters:
+///     - array: input array of shape `[N, H, W, C_in]`
+///     - weight: weight array of shape `[C_out, H, W, C_in]`
+///     - stride: kernel stride
+///     - padding: input padding
+///     - dilation: kernel dilation
+///     - outputPadding: output padding
+///     - groups: input feature groups
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:convolution>
+/// - ``IntOrPair``
+/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``convTransposed1d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
+/// - ``convTransposed3d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
+/// - ``convolve(_:_:mode:stream:)``
+/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,IntOrArray,IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
+public func convTransposed2d(
+    _ array: MLXArray, _ weight: MLXArray, stride: IntOrPair = 1, padding: IntOrPair = 0,
+    dilation: IntOrPair = 1, outputPadding: IntOrPair = 0, groups: Int = 1,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_conv_transpose2d(
+        &output, array.ctx, weight.ctx,
+        stride.first.int32, stride.second.int32,
+        padding.first.int32, padding.second.int32,
+        dilation.first.int32, dilation.second.int32,
+        outputPadding.first.int32, outputPadding.second.int32, groups.int32, stream.ctx)
+    return MLXArray(output)
+}
+
+/// 3D transposed convolution over an input with several channels.
+///
+/// > Only the default `groups=1` is currently supported.
+///
+/// The numeric parameters may be given as single values:
+///
+/// ```swift
+/// padding: 1
+/// ```
+///
+/// This will produce a padding of `(1, 1, 1)`.  You can also give an array:
+///
+/// ```swift
+/// padding: [2, 3, 3]
+/// ```
+///
+/// See ``IntOrTriple`` for more information.
+///
+/// - Parameters:
+///     - array: input array of shape `[N, D, H, W, C_in]`
+///     - weight: weight array of shape `[C_out, D, H, W, C_in]`
+///     - stride: kernel stride
+///     - padding: input padding
+///     - dilation: kernel dilation
+///     - outputPadding: output padding
+///     - groups: input feature groups
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:convolution>
+/// - ``IntOrTriple``
+/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``convTransposed1d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
+/// - ``convTransposed2d(_:_:stride:padding:dilation:outputPadding:groups:stream:)``
+/// - ``convolve(_:_:mode:stream:)``
+/// - ``convGeneral(_:_:strides:padding:kernelDilation:inputDilation:groups:flip:stream:)-(MLXArray,MLXArray,IntOrArray,IntOrArray,IntOrArray,IntOrArray,Int,Bool,StreamOrDevice)``
+public func convTransposed3d(
+    _ array: MLXArray, _ weight: MLXArray, stride: IntOrTriple = 1, padding: IntOrTriple = 0,
+    dilation: IntOrTriple = 1, outputPadding: IntOrTriple = 0, groups: Int = 1,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_conv_transpose3d(
+        &output, array.ctx, weight.ctx,
+        stride.first.int32, stride.second.int32, stride.third.int32,
+        padding.first.int32, padding.second.int32, padding.third.int32,
+        dilation.first.int32, dilation.second.int32, dilation.third.int32,
+        outputPadding.first.int32, outputPadding.second.int32, outputPadding.third.int32,
+        groups.int32,
+        stream.ctx)
+    return MLXArray(output)
+}
+
+/// Mode for ``convolve(_:_:mode:stream:)``
+public enum ConvolveMode: Sendable {
+    // `.full` pads by the kernel size minus one, `.valid` adds no padding and `.same`
+    // pads so the result is sized like the longer input (see `convolve`)
+    case full, valid, same
+}
+
+/// The discrete convolution of 1D arrays.
+///
+/// - Parameters:
+///     - a: 1D input array
+///     - b: 1D input array
+///     - mode: padding mode
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:convolution>
+/// - ``conv1d(_:_:stride:padding:dilation:groups:stream:)``
+/// - ``conv2d(_:_:stride:padding:dilation:groups:stream:)``
+public func convolve(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, mode: ConvolveMode = .full,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (a, b) = toArrays(a, b)
+
+    precondition(a.ndim == 1, "inputs must be 1d (a)")
+    precondition(b.ndim == 1, "inputs must be 1d (b)")
+    // the shorter array acts as the kernel, the longer one as the signal
+    var (input, weight) = a.size < b.size ? (b, a) : (a, b)
+    // reverse the kernel: slice from the last element backwards with step -1
+    var slice = mlx_array_new()
+    mlx_slice(
+        &slice,
+        weight.ctx, [weight.dim(0) - 1].asInt32, 1, [-weight.dim(0) - 1].asInt32, 1, [-1], 1,
+        stream.ctx)
+    weight = MLXArray(slice)
+    // add unit leading and trailing axes around the single spatial axis for conv1d
+    weight = weight.reshaped([1, -1, 1], stream: stream)
+    input = input.reshaped([1, -1, 1], stream: stream)
+
+    let weightSize = weight.size
+    var padding = 0
+
+    switch mode {
+    case .full:
+        padding = weightSize - 1
+    case .valid:
+        padding = 0
+    case .same:
+        if weightSize % 2 == 1 {
+            padding = weightSize / 2
+        } else {
+            // left + right padding must total weightSize - 1 to preserve the input length
+            let padLeft = weightSize / 2
+            let padRight = max(0, padLeft - 1)
+            input = padded(input, widths: [0, [padLeft, padRight], 0], stream: stream)
+        }
+    }
+
+    var result = mlx_array_new()
+    mlx_conv1d(&result, input.ctx, weight.ctx, 1, padding.int32, 1, 1, stream.ctx)
+    return MLXArray(result).reshaped(-1, stream: stream)
+}
+
+/// Element-wise hyperbolic cosine.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``cos(_:stream:)``
+public func cosh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_cosh(&output, array.ctx, stream.ctx)
+    return MLXArray(output)
+}
+
+/// Convert angles from radians to degrees.
+///
+/// - Parameters:
+///   - array: input array
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``radians(_:stream:)``
+public func degrees(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var converted = mlx_array_new()
+    mlx_degrees(&converted, array.ctx, stream.ctx)
+    return MLXArray(converted)
+}
+
+/// Insert dependencies between arrays in the graph. The outputs are
+/// identical to `input` but with dependencies on `dependencies`.
+///
+/// - Parameters:
+///   - input: input array
+///   - dependencies: arrays to depend on
+/// - Returns: output which depends on the `dependencies`
+///
+/// ### See Also
+/// - ``depends(inputs:dependencies:)``
+public func depends(input: MLXArray, dependencies: [MLXArray]) -> MLXArray {
+    var outputs = mlx_vector_array_new()
+    defer { mlx_vector_array_free(outputs) }
+    let inputVector = new_mlx_vector_array([input])
+    defer { mlx_vector_array_free(inputVector) }
+    let dependencyVector = new_mlx_vector_array(dependencies)
+    defer { mlx_vector_array_free(dependencyVector) }
+    mlx_depends(&outputs, inputVector, dependencyVector)
+
+    // a single input was supplied, so the first output is its counterpart
+    return mlx_vector_array_values(outputs)[0]
+}
+
+/// Insert dependencies between arrays in the graph. The outputs are
+/// identical to `inputs` but with dependencies on `dependencies`.
+///
+/// - Parameters:
+///   - inputs: input arrays
+///   - dependencies: arrays to depend on
+/// - Returns: outputs which depends on the `dependencies`
+///
+/// ### See Also
+/// - ``depends(input:dependencies:)``
+public func depends(inputs: [MLXArray], dependencies: [MLXArray]) -> [MLXArray] {
+    var outputs = mlx_vector_array_new()
+    defer { mlx_vector_array_free(outputs) }
+    let inputVector = new_mlx_vector_array(inputs)
+    defer { mlx_vector_array_free(inputVector) }
+    let dependencyVector = new_mlx_vector_array(dependencies)
+    defer { mlx_vector_array_free(dependencyVector) }
+    mlx_depends(&outputs, inputVector, dependencyVector)
+
+    return mlx_vector_array_values(outputs)
+}
+
+/// Quantization modes for weight compression in neural networks.
+///
+/// Quantization reduces the precision of model weights to decrease memory usage and
+/// potentially improve inference speed. Different modes use different strategies for
+/// mapping full-precision values to lower-precision representations.
+///
+/// The `.affine` mode carries its own `groupSize` and `bits`; the remaining modes
+/// use fixed parameters that are exposed through ``groupSize`` and ``bits``.
+///
+/// ## Usage
+///
+/// ```swift
+/// // affine mode with the default parameters (groupSize: 64, bits: 4)
+/// let mode = QuantizationMode.affine()
+///
+/// // affine mode with custom parameters
+/// let mode = QuantizationMode.affine(groupSize: 32, bits: 8)
+///
+/// // MXFP4 mode (fixed parameters: groupSize = 32, bits = 4)
+/// let mode = QuantizationMode.mxfp4
+/// ```
+public enum QuantizationMode: Equatable, Sendable {
+    /// Affine (linear) quantization with configurable group size and bit width.
+    ///
+    /// This is the standard quantization approach where values are quantized using:
+    /// ```
+    /// quantized_value = round((value - bias) / scale)
+    /// dequantized_value = quantized_value * scale + bias
+    /// ```
+    ///
+    /// The `scale` and `bias` parameters are computed per group of `groupSize` elements
+    /// to minimize quantization error. This mode provides good compression with reasonable
+    /// accuracy preservation for most neural network weights.
+    ///
+    /// - Parameters:
+    ///   - groupSize: Number of elements per quantization group. Default is 64.
+    ///   - bits: Number of bits per quantized element. Default is 4.
+    case affine(groupSize: Int = 64, bits: Int = 4)
+
+    /// MX (Microscaling) FP4 quantization format.
+    ///
+    /// Fixed parameters: groupSize = 32, bits = 4.
+    ///
+    /// ### See Also
+    /// - https://www.opencompute.org/documents/ocp-microscaling-formats-mx-v1-0-spec-final-pdf
+    case mxfp4
+
+    /// MX (Microscaling) FP8 quantization format.
+    ///
+    /// Fixed parameters: groupSize = 32, bits = 8.
+    ///
+    /// ### See Also
+    /// - https://www.opencompute.org/documents/ocp-microscaling-formats-mx-v1-0-spec-final-pdf
+    case mxfp8
+
+    /// NVIDIA FP4 quantization format.
+    ///
+    /// Fixed parameters: groupSize = 16, bits = 4.
+    case nvfp4
+
+    /// Name of the mode as passed to the underlying C API.
+    var cName: String {
+        switch self {
+        case .affine:
+            return "affine"
+        case .mxfp4:
+            return "mxfp4"
+        case .mxfp8:
+            return "mxfp8"
+        case .nvfp4:
+            return "nvfp4"
+        }
+    }
+
+    /// Effective group size for this quantization mode.
+    ///
+    /// For `.affine` this is the associated value. The other modes have a group size
+    /// fixed by their format: 32 for the MX modes and 16 for NVFP4.
+    public var groupSize: Int {
+        switch self {
+        case .affine(let groupSize, _):
+            return groupSize
+        case .mxfp4, .mxfp8:
+            return 32
+        case .nvfp4:
+            return 16
+        }
+    }
+
+    /// Number of bits per quantized element for this quantization mode.
+    ///
+    /// For `.affine` this is the associated value. The other modes have a bit width
+    /// fixed by their format: 4 for MXFP4 and NVFP4, 8 for MXFP8.
+    public var bits: Int {
+        switch self {
+        case .affine(_, let bits):
+            return bits
+        case .mxfp4, .nvfp4:
+            return 4
+        case .mxfp8:
+            return 8
+        }
+    }
+}
+
+extension QuantizationMode: Codable {
+    /// Keys of the keyed (object) representation.
+    private enum CodingKeys: String, CodingKey {
+        case type, groupSize, bits
+    }
+
+    /// Decodes the keyed form (`type` plus optional `groupSize` / `bits`) and, for
+    /// compatibility with the former `String`-backed enum, a bare mode name.
+    public init(from decoder: Decoder) throws {
+        let name: String
+        var groupSize = 64
+        var bits = 4
+        if let bare = try? decoder.singleValueContainer().decode(String.self) {
+            // legacy encoding: only the name is available, affine keeps its defaults
+            name = bare
+        } else {
+            let container = try decoder.container(keyedBy: CodingKeys.self)
+            name = try container.decode(String.self, forKey: .type)
+            if name == "affine" {
+                groupSize = try container.decodeIfPresent(Int.self, forKey: .groupSize) ?? 64
+                bits = try container.decodeIfPresent(Int.self, forKey: .bits) ?? 4
+            }
+        }
+        switch name {
+        case "affine": self = .affine(groupSize: groupSize, bits: bits)
+        case "mxfp4": self = .mxfp4
+        case "mxfp8": self = .mxfp8
+        case "nvfp4": self = .nvfp4
+        default:
+            throw DecodingError.dataCorrupted(.init(
+                codingPath: decoder.codingPath,
+                debugDescription: "Valeur inconnue pour QuantizationMode : \(name)"))
+        }
+    }
+
+    /// Encodes the keyed form; `groupSize` and `bits` are written for `.affine` only.
+    public func encode(to encoder: Encoder) throws {
+        var container = encoder.container(keyedBy: CodingKeys.self)
+        try container.encode(cName, forKey: .type)
+        if case .affine(let groupSize, let bits) = self {
+            try container.encode(groupSize, forKey: .groupSize)
+            try container.encode(bits, forKey: .bits)
+        }
+    }
+}
+
+/// Dequantize the matrix `w` using the provided `scales` and
+/// `biases` and the `groupSize` and `bits` configuration.
+///
+/// For details, please see
+/// [this documentation](https://ml-explore.github.io/mlx/build/html/python/_autosummary/mlx.core.dequantize.html)
+///
+/// `groupSize` and `bits` are resolved in this order:
+/// 1. the explicit argument, when not `nil`
+/// 2. the value carried by `mode` when it is `.affine(groupSize:bits:)`
+/// 3. otherwise no value is passed and the backend chooses for the mode
+///
+/// - Parameters:
+///   - w: The quantized weight matrix to dequantize
+///   - scales: Scaling factors used during quantization. Should have shape compatible with the quantized groups
+///   - biases: Bias values used during quantization. Should have shape compatible with the quantized groups
+///   - groupSize: The size of each quantization group. When `nil` (the default) it is resolved as described above
+///   - bits: The number of bits used per quantized element. When `nil` (the default) it is resolved as described above
+///   - mode: The quantization mode used. Default is `.affine()`
+///   - globalScale: The per-input float32 scale used for  ``QuantizationMode/nvfp4``
+///   - dtype: data type of the output.  If not specified it will be inferred from the scales and biases.
+///   - stream: Stream or device to evaluate on
+///
+/// ### See Also
+/// - ``quantized(_:groupSize:bits:mode:globalScale:stream:)``
+/// - ``quantizedMM(_:_:scales:biases:transpose:groupSize:bits:mode:stream:)``
+public func dequantized(
+    _ w: MLXArray,
+    scales: MLXArray, biases: MLXArray?,
+    groupSize: Int? = nil, bits: Int? = nil, mode: QuantizationMode = .affine(),
+    globalScale: MLXArray? = nil,
+    dtype: DType? = nil,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    // Explicit arguments win. Otherwise honor the values carried by `.affine`
+    // so that `.affine(groupSize: 32, bits: 8)` is not silently ignored.
+    // Fixed-format modes still pass "no value" and let the backend decide.
+    var effectiveGroupSize = groupSize
+    var effectiveBits = bits
+    if case .affine(let modeGroupSize, let modeBits) = mode {
+        effectiveGroupSize = groupSize ?? modeGroupSize
+        effectiveBits = bits ?? modeBits
+    }
+
+    var result = mlx_array_new()
+    let cGroupSize = mlx_optional_int(
+        value: Int32(effectiveGroupSize ?? 0), has_value: effectiveGroupSize != nil)
+    let cBits = mlx_optional_int(
+        value: Int32(effectiveBits ?? 0), has_value: effectiveBits != nil)
+    let cDtype = mlx_optional_dtype(
+        value: dtype?.cmlxDtype ?? MLX_FLOAT16, has_value: dtype != nil)
+    mlx_dequantize(
+        &result, w.ctx,
+        scales.ctx, (biases ?? .mlxNone).ctx, cGroupSize, cBits, mode.cName,
+        (globalScale ?? .mlxNone).ctx,
+        cDtype,
+        stream.ctx)
+    return MLXArray(result)
+}
+
+/// Element-wise division.
+///
+/// Divides `a` by `b` element by element, applying <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = MLXArray([4, 5, 6])
+///
+/// let r = a / b / 7
+/// ```
+///
+/// - Parameters:
+///     - a: the dividend (left hand side)
+///     - b: the divisor (right hand side)
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``divmod(_:_:stream:)``
+public func divide(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (dividend, divisor) = toArrays(a, b)
+    var quotient = mlx_array_new()
+    mlx_divide(&quotient, dividend.ctx, divisor.ctx, stream.ctx)
+    return MLXArray(quotient)
+}
+
+/// Element-wise quotient and remainder.
+///
+/// The function `divmod(a, b)` is equivalent to but faster than
+/// `(a // b, a % b)`. The function uses numpy-style broadcasting
+/// semantics. Either or both input arrays can also be scalars.
+///
+/// - Parameters:
+///   - a: input array or scalar
+///   - b: input array or scalar
+///   - stream: stream or device to evaluate on
+/// - Returns: The quotient `a // b` and remainder `a % b`
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``divide(_:_:stream:)``
+/// - ``remainder(_:_:stream:)``
+public func divmod(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> (MLXArray, MLXArray) {
+    let (lhs, rhs) = toArrays(a, b)
+
+    // The C call returns both outputs in a vector that must be freed on exit.
+    var outputs = mlx_vector_array_new()
+    defer { mlx_vector_array_free(outputs) }
+    mlx_divmod(&outputs, lhs.ctx, rhs.ctx, stream.ctx)
+
+    let pair = mlx_vector_array_values(outputs)
+    return (pair[0], pair[1])
+}
+
+/// Perform the Einstein summation convention on the operands.
+///
+/// Variadic convenience that forwards to the collection-based overload.
+///
+/// - Parameters:
+///   - subscripts: Einstein summation convention equation
+///   - operands: input arrays
+///   - stream: stream or device to evaluate on
+public func einsum(_ subscripts: String, _ operands: MLXArray..., stream: StreamOrDevice = .default)
+    -> MLXArray
+{
+    return einsum(subscripts, operands: operands, stream: stream)
+}
+
+/// Perform the Einstein summation convention on the operands.
+///
+/// - Parameters:
+///   - subscripts: Einstein summation convention equation
+///   - operands: collection of input arrays
+///   - stream: stream or device to evaluate on
+public func einsum(
+    _ subscripts: String, operands: some Collection<MLXArray>, stream: StreamOrDevice = .default
+)
+    -> MLXArray
+{
+    // Temporary C vector holding the operands; released when the function exits.
+    let operandVector = new_mlx_vector_array(operands)
+    defer { mlx_vector_array_free(operandVector) }
+
+    var out = mlx_array_new()
+    mlx_einsum(&out, subscripts, operandVector, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise equality.
+///
+/// Compares two arrays for equality with <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = a + 1
+///
+/// if (a .== b).all().item() {
+///     ...
+/// }
+/// ```
+///
+/// - Parameters:
+///     - a: the left hand side array
+///     - b: the right hand side array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:logical>
+public func equal(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_equal(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise error function.
+///
+/// For details, please see
+/// [this documentation](https://ml-explore.github.io/mlx/build/html/python/_autosummary/mlx.core.erf.html)
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``erfInverse(_:stream:)``
+public func erf(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_erf(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise inverse of ``erf(_:stream:)``.
+///
+/// For details, please see
+/// [this documentation](https://ml-explore.github.io/mlx/build/html/python/_autosummary/mlx.core.erfinv.html)
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``erf(_:stream:)``
+public func erfInverse(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_erfinv(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Add size one dimensions at the given axes.
+///
+/// - Parameters:
+///     - array: input array
+///     - axes: indexes of the inserted dimensions
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:shapes>
+/// - ``expandedDimensions(_:axis:stream:)``
+public func expandedDimensions(
+    _ array: MLXArray, axes: some Collection<Int>, stream: StreamOrDevice = .default
+)
+    -> MLXArray
+{
+    var expanded = mlx_array_new()
+    mlx_expand_dims_axes(
+        &expanded, array.ctx,
+        axes.asInt32, axes.count,
+        stream.ctx)
+    return MLXArray(expanded)
+}
+
+/// Add a size one dimension at the given axis.
+///
+/// - Parameters:
+///     - array: input array
+///     - axis: index of the inserted dimension
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:shapes>
+/// - ``expandedDimensions(_:axes:stream:)``
+public func expandedDimensions(_ array: MLXArray, axis: Int, stream: StreamOrDevice = .default)
+    -> MLXArray
+{
+    // Single-axis case: pass a one-element axes list to the same C entry point.
+    var expanded = mlx_array_new()
+    mlx_expand_dims_axes(&expanded, array.ctx, [axis.int32], 1, stream.ctx)
+    return MLXArray(expanded)
+}
+
+/// Element-wise exponential minus 1.
+///
+/// Computes `exp(x) - 1` with greater precision for small `x`.
+///
+/// - Parameters:
+///   - array: input array
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``exp(_:stream:)``
+public func expm1(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_expm1(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Deprecated spelling that forwards every argument unchanged to
+/// `gatherMM(_:_:lhsIndices:rhsIndices:sortedIndices:stream:)`.
+@available(*, deprecated, renamed: "gatherMM(_:_:lhsIndices:rhsIndices:sortedIndices:stream:)")
+public func gatherMatmul(
+    _ a: MLXArray, _ b: MLXArray, lhsIndices: MLXArray? = nil, rhsIndices: MLXArray? = nil,
+    sortedIndices: Bool = false, stream: StreamOrDevice = .default
+) -> MLXArray {
+    return gatherMM(
+        a, b,
+        lhsIndices: lhsIndices,
+        rhsIndices: rhsIndices,
+        sortedIndices: sortedIndices,
+        stream: stream)
+}
+
+/// Matrix multiplication with matrix-level gather.
+///
+/// Performs a gather of the operands with the given indices followed by a
+/// (possibly batched) matrix multiplication of two arrays.  This operation
+/// is more efficient than explicitly applying a `take` followed by a
+/// `matmul`.
+///
+/// The indices `lhsIndices` and `rhsIndices` contain flat indices
+/// along the batch dimensions (i.e. all but the last two dimensions) of
+/// `a` and `b` respectively.
+///
+/// For `a` with shape `(A1, A2, ..., AS, M, K)`, `lhsIndices`
+/// contains indices from the range `[0, A1 * A2 * ... * AS)`
+///
+/// For `b` with shape `(B1, B2, ..., BS, M, K)`, `rhsIndices`
+/// contains indices from the range `[0, B1 * B2 * ... * BS)`
+///
+/// A `nil` index argument is passed to the backend as an empty ("none") array.
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``matmul(_:_:stream:)``
+public func gatherMM(
+    _ a: MLXArray, _ b: MLXArray, lhsIndices: MLXArray? = nil, rhsIndices: MLXArray? = nil,
+    sortedIndices: Bool = false, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let lhs = lhsIndices ?? .mlxNone
+    let rhs = rhsIndices ?? .mlxNone
+
+    var product = mlx_array_new()
+    mlx_gather_mm(&product, a.ctx, b.ctx, lhs.ctx, rhs.ctx, sortedIndices, stream.ctx)
+    return MLXArray(product)
+}
+
+/// Deprecated spelling that forwards every argument unchanged to
+/// `gatherQuantizedMM(_:_:scales:biases:lhsIndices:rhsIndices:transpose:groupSize:bits:mode:sortedIndices:stream:)`.
+@available(
+    *, deprecated,
+    renamed:
+        "gatherQuantizedMM(_:_:scales:biases:lhsIndices:rhsIndices:transpose:groupSize:bits:mode:sortedIndices:stream:)"
+)
+public func gatherQuantizedMatmul(
+    _ x: MLXArray, _ w: MLXArray, scales: MLXArray, biases: MLXArray?,
+    lhsIndices: MLXArray? = nil, rhsIndices: MLXArray? = nil,
+    transpose: Bool = true, groupSize: Int? = nil, bits: Int? = nil,
+    mode: QuantizationMode = .affine(),
+    sortedIndices: Bool = false,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    return gatherQuantizedMM(
+        x, w,
+        scales: scales,
+        biases: biases,
+        lhsIndices: lhsIndices,
+        rhsIndices: rhsIndices,
+        transpose: transpose,
+        groupSize: groupSize,
+        bits: bits,
+        mode: mode,
+        sortedIndices: sortedIndices,
+        stream: stream)
+}
+
+/// Perform quantized matrix multiplication with matrix-level gather.
+///
+/// This operation is the quantized equivalent to ``gatherMM(_:_:lhsIndices:rhsIndices:sortedIndices:stream:)``
+///
+/// Note that `scales` and `biases` must have the same batch dimensions
+/// as `w` since they represent the same quantized matrix.
+///
+/// `groupSize` and `bits` are resolved in this order:
+/// 1. the explicit argument, when not `nil`
+/// 2. the value carried by `mode` when it is `.affine(groupSize:bits:)`
+/// 3. otherwise no value is passed and the backend chooses for the mode
+///
+/// - Parameters:
+///   - x: The input matrix
+///   - w: The quantized weight matrix to be used in the matrix multiplication
+///   - scales: The scales to use per `groupSize` elements of `w`
+///   - biases: The biases to use per `groupSize` elements of `w`
+///   - lhsIndices: Optional indices for gathering from the left-hand side matrix
+///   - rhsIndices: Optional indices for gathering from the right-hand side matrix
+///   - transpose: Whether to transpose the weight matrix `w`. Default is `true`
+///   - groupSize: The size of the group in `w` that shares a scale and bias. When `nil` (the default) it is resolved as described above
+///   - bits: The number of bits occupied by each element in `w`. When `nil` (the default) it is resolved as described above
+///   - mode: The quantization mode. Default is `.affine()`
+///   - sortedIndices: Whether the indices are sorted. Default is `false`
+///   - stream: Stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``quantizedMM(_:_:scales:biases:transpose:groupSize:bits:mode:stream:)``
+public func gatherQuantizedMM(
+    _ x: MLXArray, _ w: MLXArray, scales: MLXArray, biases: MLXArray?,
+    lhsIndices: MLXArray? = nil, rhsIndices: MLXArray? = nil,
+    transpose: Bool = true, groupSize: Int? = nil, bits: Int? = nil,
+    mode: QuantizationMode = .affine(),
+    sortedIndices: Bool = false,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    // Explicit arguments win. Otherwise honor the values carried by `.affine`
+    // so that `.affine(groupSize: 32, bits: 8)` is not silently ignored.
+    // Fixed-format modes still pass "no value" and let the backend decide.
+    var effectiveGroupSize = groupSize
+    var effectiveBits = bits
+    if case .affine(let modeGroupSize, let modeBits) = mode {
+        effectiveGroupSize = groupSize ?? modeGroupSize
+        effectiveBits = bits ?? modeBits
+    }
+
+    var result = mlx_array_new()
+
+    let cGroupSize = mlx_optional_int(
+        value: Int32(effectiveGroupSize ?? 0), has_value: effectiveGroupSize != nil)
+    let cBits = mlx_optional_int(
+        value: Int32(effectiveBits ?? 0), has_value: effectiveBits != nil)
+
+    mlx_gather_qmm(
+        &result,
+        x.ctx, w.ctx, scales.ctx, (biases ?? .mlxNone).ctx, (lhsIndices ?? .mlxNone).ctx,
+        (rhsIndices ?? .mlxNone).ctx, transpose,
+        cGroupSize, cBits, mode.cName, sortedIndices,
+        stream.ctx)
+
+    return MLXArray(result)
+}
+
+/// Element-wise greater than.
+///
+/// Compares two arrays with `>`, applying <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = a + 1
+///
+/// if (a .> b).all().item() {
+///     ...
+/// }
+/// ```
+///
+/// - Parameters:
+///     - a: the left hand side array
+///     - b: the right hand side array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:logical>
+public func greater(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_greater(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise greater than or equal.
+///
+/// Compares two arrays with `>=`, applying <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = a + 1
+///
+/// if (a .>= b).all().item() {
+///     ...
+/// }
+/// ```
+///
+/// - Parameters:
+///     - a: the left hand side array
+///     - b: the right hand side array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:logical>
+public func greaterEqual(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_greater_equal(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Perform the Walsh-Hadamard transform along the final axis.
+///
+/// Supports sizes `n = m*2^k` for `m` in `(1, 12, 20, 28)` and `2^k <= 8192`
+/// for ``DType/float32`` and `2^k <= 16384` for ``DType/float16`` and ``DType/bfloat16``.
+///
+/// - Parameters:
+///   - array: input array
+///   - scale: scale the output by this factor -- default is `1.0/sqrt(array.dim(-1))`
+///   - stream: stream to evaluate on
+public func hadamardTransform(
+    _ array: MLXArray, scale: Float? = nil, stream: StreamOrDevice = .default
+) -> MLXArray {
+    // A nil scale is passed as "no value" so the backend applies its default.
+    let cScale = mlx_optional_float(value: scale ?? 0, has_value: scale != nil)
+    var transformed = mlx_array_new()
+    mlx_hadamard_transform(&transformed, array.ctx, cScale, stream.ctx)
+    return MLXArray(transformed)
+}
+
+/// Return the Hamming window.
+///
+/// The Hamming window is a taper formed by using a weighted cosine.
+///
+/// - Parameters:
+///   - m: number of points in the output window
+///   - stream: stream to evaluate on
+/// - Returns: The window, with the maximum value normalized to one (the value one appears only if
+///     the number of samples is odd).
+public func hamming(
+    _ m: Int, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var window = mlx_array_new()
+    mlx_hamming(&window, Int32(m), stream.ctx)
+    return MLXArray(window)
+}
+
+/// Return the Hanning window.
+///
+/// The Hanning window is a taper formed by using a weighted cosine.
+///
+/// - Parameters:
+///   - m: number of points in the output window
+///   - stream: stream to evaluate on
+/// - Returns: The window, with the maximum value normalized to one (the value one appears only if
+///     the number of samples is odd).
+public func hanning(
+    _ m: Int, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var window = mlx_array_new()
+    mlx_hanning(&window, Int32(m), stream.ctx)
+    return MLXArray(window)
+}
+
+/// Ordinary inner product of vectors for 1-D arrays, in higher dimensions a sum product over the last axes.
+///
+/// - Parameters:
+///   - a: first input array
+///   - b: second input array
+///   - stream: stream or device to evaluate on
+/// - Returns: inner product
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func inner(
+    _ a: MLXArray, _ b: MLXArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var product = mlx_array_new()
+    mlx_inner(&product, a.ctx, b.ctx, stream.ctx)
+    return MLXArray(product)
+}
+
+/// Returns a boolean array where two arrays are element-wise equal within a tolerance.
+///
+/// Infinite values are considered equal if they have the same sign, NaN values are not equal unless
+/// `equalNaN` is `true`.
+///
+/// Two values are considered close if:
+///
+/// ```swift
+/// abs(a - b) <= (atol + rtol * abs(b))
+/// ```
+///
+/// Unlike ``arrayEqual(_:_:equalNAN:stream:)`` this function supports <doc:broadcasting>.
+///
+/// - Parameters:
+///   - a: input array
+///   - b: input array
+///   - rtol: relative tolerance (see discussion)
+///   - atol: absolute tolerance (see discussion)
+///   - equalNaN: if `true` treat NaN values as equal to each other
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - ``allClose(_:_:rtol:atol:equalNaN:stream:)``
+/// - ``arrayEqual(_:_:equalNAN:stream:)``
+public func isClose(
+    _ a: MLXArray, _ b: MLXArray, rtol: Double = 1e-5, atol: Double = 1e-8, equalNaN: Bool = false,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var mask = mlx_array_new()
+    mlx_isclose(&mask, a.ctx, b.ctx, rtol, atol, equalNaN, stream.ctx)
+    return MLXArray(mask)
+}
+
+/// Return a boolean array indicating which elements are NaN.
+///
+/// - Parameters:
+///   - array: input array
+///   - stream: stream or device to evaluate on
+/// - Returns: The boolean array indicating which elements are NaN.
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func isNaN(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var mask = mlx_array_new()
+    mlx_isnan(&mask, array.ctx, stream.ctx)
+    return MLXArray(mask)
+}
+
+/// Return a boolean array indicating which elements are infinity.
+///
+/// - Parameters:
+///   - array: input array
+///   - stream: stream or device to evaluate on
+/// - Returns: The boolean array indicating which elements are infinity.
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func isInf(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var mask = mlx_array_new()
+    mlx_isinf(&mask, array.ctx, stream.ctx)
+    return MLXArray(mask)
+}
+
+/// Return a boolean array indicating which elements are finite.
+///
+/// - Parameters:
+///   - array: input array
+///   - stream: stream or device to evaluate on
+/// - Returns: The boolean array indicating which elements are finite.
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func isFinite(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var mask = mlx_array_new()
+    mlx_isfinite(&mask, array.ctx, stream.ctx)
+    return MLXArray(mask)
+}
+
+/// Return a boolean array indicating which elements are negative infinity.
+///
+/// - Parameters:
+///   - array: input array
+///   - stream: stream or device to evaluate on
+/// - Returns: The boolean array indicating which elements are negative infinity.
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func isNegInf(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var mask = mlx_array_new()
+    mlx_isneginf(&mask, array.ctx, stream.ctx)
+    return MLXArray(mask)
+}
+
+/// Return a boolean array indicating which elements are positive infinity.
+///
+/// - Parameters:
+///   - array: input array
+///   - stream: stream or device to evaluate on
+/// - Returns: The boolean array indicating which elements are positive infinity.
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func isPosInf(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var mask = mlx_array_new()
+    mlx_isposinf(&mask, array.ctx, stream.ctx)
+    return MLXArray(mask)
+}
+
+/// Element-wise less than.
+///
+/// Compares two arrays with `<`, applying <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = a + 1
+///
+/// if (a .< b).all().item() {
+///     ...
+/// }
+/// ```
+///
+/// - Parameters:
+///     - a: the left hand side array
+///     - b: the right hand side array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:logical>
+public func less(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_less(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise less than or equal.
+///
+/// Compares two arrays with `<=`, applying <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = a + 1
+///
+/// if (a .<= b).all().item() {
+///     ...
+/// }
+/// ```
+///
+/// - Parameters:
+///     - a: the left hand side array
+///     - b: the right hand side array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:logical>
+public func lessEqual(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_less_equal(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise log-add-exp.
+///
+/// This is a numerically stable log-add-exp of two arrays with numpy-style
+/// broadcasting semantics. Either or both input arrays can also be scalars.
+///
+/// The computation is a numerically stable version of `log(exp(a) + exp(b))`.
+///
+/// - Parameters:
+///     - a: the left hand side array
+///     - b: the right hand side array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func logAddExp(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_logaddexp(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise logical and.
+///
+/// Combines two arrays with logical and, applying <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = a + 1
+///
+/// // equivalent
+/// let r = (a .< b) .&& ((a + 1) .> b)
+/// let r2 = logicalAnd((a .< b), ((a + 1) .> b))
+/// ```
+///
+/// - Parameters:
+///   - a: input array or scalar
+///   - b: input array or scalar
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - <doc:logical>
+/// - ``MLXArray/.&&(_:_:)``
+public func logicalAnd(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_logical_and(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise logical not.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = a + 1
+/// let r = !(a == b)
+/// ```
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - <doc:logical>
+public func logicalNot(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var negated = mlx_array_new()
+    mlx_logical_not(&negated, array.ctx, stream.ctx)
+    return MLXArray(negated)
+}
+
+/// Element-wise logical or.
+///
+/// Combines two arrays with logical or, applying <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = a + 1
+///
+/// // equivalent
+/// let r = (a .< b) .|| ((a + 1) .> b)
+/// let r2 = logicalOr((a .< b), ((a + 1) .> b))
+/// ```
+///
+/// - Parameters:
+///   - a: input array or scalar
+///   - b: input array or scalar
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - <doc:logical>
+/// - ``MLXArray/.||(_:_:)``
+public func logicalOr(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_logical_or(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Coordinate convention used by ``meshGrid(_:sparse:indexing:stream:)``.
+///
+/// The raw value of each case is its name.
+public enum MeshGridIndexing: String, Sendable {
+    /// cartesian indexing
+    case xy = "xy"
+
+    /// matrix indexing
+    case ij = "ij"
+}
+
+/// Generate multidimensional coordinate grids from 1-D coordinate arrays
+///
+/// - Parameters:
+///   - arrays: input arrays
+///   - sparse: if `true` a sparse grid is returned in which each output array has a single
+///     non-zero element, otherwise a dense grid is returned.
+///   - indexing: indexing mode
+///   - stream: stream or device to evaluate on
+public func meshGrid(
+    _ arrays: some Collection<MLXArray>, sparse: Bool = false, indexing: MeshGridIndexing = .xy,
+    stream: StreamOrDevice = .default
+) -> [MLXArray] {
+    // Both C vectors (inputs and outputs) are released when the function exits.
+    let inputs = new_mlx_vector_array(arrays)
+    defer { mlx_vector_array_free(inputs) }
+
+    var grids = mlx_vector_array_new()
+    defer { mlx_vector_array_free(grids) }
+
+    // The indexing mode is passed to the C API by name.
+    mlx_meshgrid(
+        &grids, inputs, sparse,
+        indexing.rawValue.cString(using: .utf8),
+        stream.ctx)
+
+    return mlx_vector_array_values(grids)
+}
+
+/// Element-wise maximum.
+///
+/// Take the element-wise max of two arrays with <doc:broadcasting>
+/// semantics.
+///
+/// - Parameters:
+///     - a: the first array
+///     - b: the second array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``minimum(_:_:stream:)``
+public func maximum(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (first, second) = toArrays(a, b)
+    var larger = mlx_array_new()
+    mlx_maximum(&larger, first.ctx, second.ctx, stream.ctx)
+    return MLXArray(larger)
+}
+
+/// Compute the median(s) over the given axis.
+///
+/// - Parameters:
+///     - a: the input array
+///     - axis: axis to reduce over
+///     - keepDims: if `true` keep reduced axis as singleton dimension
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:reduction>
+public func median(
+    _ a: MLXArray, axis: Int, keepDims: Bool = false,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    // Single-axis case: pass a one-element axes list to the C entry point.
+    var reduced = mlx_array_new()
+    mlx_median(&reduced, a.ctx, [axis.int32], 1, keepDims, stream.ctx)
+    return MLXArray(reduced)
+}
+
+/// Compute the median(s) over the given axes.
+///
+/// - Parameters:
+///     - a: the input array
+///     - axes: axes to reduce over
+///     - keepDims: if `true` keep reduced axes as singleton dimensions
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:reduction>
+public func median(
+    _ a: MLXArray, axes: [Int], keepDims: Bool = false,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var reduced = mlx_array_new()
+    mlx_median(
+        &reduced, a.ctx,
+        axes.asInt32, axes.count,
+        keepDims, stream.ctx)
+    return MLXArray(reduced)
+}
+
+/// Compute the median(s) over the full array.
+///
+/// - Parameters:
+///     - a: the input array
+///     - keepDims: if `true` keep reduced axis as singleton dimension
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:reduction>
+public func median(
+    _ a: MLXArray, keepDims: Bool = false,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    // No axes are supplied (nil pointer, count 0) for the full-array variant.
+    var reduced = mlx_array_new()
+    mlx_median(&reduced, a.ctx, nil, 0, keepDims, stream.ctx)
+    return MLXArray(reduced)
+}
+
+/// Element-wise minimum.
+///
+/// Take the element-wise min of two arrays with <doc:broadcasting>
+/// semantics.
+///
+/// - Parameters:
+///     - a: the first array
+///     - b: the second array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``maximum(_:_:stream:)``
+public func minimum(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (first, second) = toArrays(a, b)
+    var smaller = mlx_array_new()
+    mlx_minimum(&smaller, first.ctx, second.ctx, stream.ctx)
+    return MLXArray(smaller)
+}
+
+/// Element-wise multiplication.
+///
+/// Multiplies two arrays element by element, applying <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = MLXArray([4, 5, 6])
+///
+/// let r = a * b * 7
+/// ```
+///
+/// - Parameters:
+///     - a: the left hand side array
+///     - b: the right hand side array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func multiply(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (lhs, rhs) = toArrays(a, b)
+    var product = mlx_array_new()
+    mlx_multiply(&product, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(product)
+}
+
+/// Replace NaN and Inf values with finite numbers.
+///
+/// - Parameters:
+///   - array: input array
+///   - nan: value to replace NaN with.  Default is `0`
+///   - posInf: value to replace positive infinities with.  Default is `0`.  Pass `nil`
+///     to use the largest finite value for the given dtype.
+///   - negInf: value to replace negative infinities with.  Default is `0`.  Pass `nil`
+///     to use the negative of the largest finite value for the given dtype.
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func nanToNum(
+    _ array: MLXArray,
+    nan: Float = 0, posInf: Float? = 0, negInf: Float? = 0,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    // A nil replacement is passed as "no value" so the backend picks its own.
+    let cPosInf = mlx_optional_float(value: posInf ?? 0, has_value: posInf != nil)
+    let cNegInf = mlx_optional_float(value: negInf ?? 0, has_value: negInf != nil)
+
+    var cleaned = mlx_array_new()
+    mlx_nan_to_num(&cleaned, array.ctx, nan, cPosInf, cNegInf, stream.ctx)
+    return MLXArray(cleaned)
+}
+
+/// Element-wise negation.
+///
+/// Produces an array holding the negated values of the input.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let r = negative(a) // e.g. -a
+/// ```
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func negative(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_negative(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise not equal.
+///
+/// Compares two operands for inequality with <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = a + 1
+///
+/// // equivalent to if (a .!= b).all().item() {
+/// if notEqual(a, b).all().item() {
+///     ...
+/// }
+/// ```
+///
+/// - Parameters:
+///     - a: the left hand side operand
+///     - b: the right hand side operand
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:logical>
+public func notEqual(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    // Run both operands through `toArrays` so each one exposes a `ctx` handle.
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_not_equal(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Compute the outer product of two 1-D arrays.
+///
+/// If the arrays passed are not 1-D, a flatten op will be run beforehand.
+///
+/// - Parameters:
+///   - a: first input array
+///   - b: second input array
+///   - stream: stream or device to evaluate on
+/// - Returns: outer product
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func outer(
+    _ a: MLXArray, _ b: MLXArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_outer(&out, a.ctx, b.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Padding strategy accepted by ``padded(_:width:mode:value:stream:)``
+public enum PadMode: String {
+    /// pad using a constant value
+    case constant = "constant"
+    /// pad using the edge values of the array
+    case edge = "edge"
+}
+
+/// Pad an array, applying the same before/after amounts to every axis.
+///
+/// - Parameters:
+///     - array: the array to pad
+///     - width: either an `Int` number of values to pad before AND after each axis or an array of 2 giving the
+///             before and after counts
+///     - mode: padding mode, see ``PadMode``
+///     - value: constant value to pad the edges with. When `nil`, a `0` of the array's dtype is used
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:shapes>
+/// - ``padded(_:widths:mode:value:stream:)``
+public func padded(
+    _ array: MLXArray, width: IntOrPair, mode: PadMode = .constant, value: MLXArray? = nil,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    let ndim = array.ndim
+    let axes = Array(Int32(0) ..< Int32(ndim))
+    // The single `width` is repeated once per axis.
+    let lowPads = Array(repeating: width.first.int32, count: ndim)
+    let highPads = Array(repeating: width.second.int32, count: ndim)
+    let value = value ?? MLXArray(0, dtype: array.dtype)
+
+    var result = mlx_array_new()
+    // `PadMode` is a `String` raw-value enum: its raw value is the name passed to the C API.
+    mlx_pad(
+        &result,
+        array.ctx, axes, axes.count, lowPads, lowPads.count, highPads, highPads.count, value.ctx,
+        mode.rawValue.cString(using: .utf8), stream.ctx)
+    return MLXArray(result)
+}
+
+/// Pad an array using per-axis before/after amounts.
+///
+/// - Parameters:
+///     - array: the array to pad
+///     - widths: array of int or pairs giving the before/after amounts for each axis. One entry
+///             per axis of `array` is expected
+///     - mode: padding mode, see ``PadMode``
+///     - value: constant value to pad the edges with. When `nil`, a `0` of the array's dtype is used
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:shapes>
+/// - ``padded(_:width:mode:value:stream:)``
+public func padded(
+    _ array: MLXArray, widths: some Collection<IntOrPair>, mode: PadMode = .constant,
+    value: MLXArray? = nil,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    let axes = Array(Int32(0) ..< Int32(array.ndim))
+    let lowPads = widths.map { $0.first.int32 }
+    let highPads = widths.map { $0.second.int32 }
+    let value = value ?? MLXArray(0, dtype: array.dtype)
+
+    var result = mlx_array_new()
+    // Pass the real length of each buffer. Reporting `ndim` for the pad buffers would let the
+    // C side read past their end whenever `widths` has fewer entries than the array has axes.
+    // `PadMode` is a `String` raw-value enum: its raw value is the name passed to the C API.
+    mlx_pad(
+        &result,
+        array.ctx, axes, axes.count, lowPads, lowPads.count, highPads, highPads.count, value.ctx,
+        mode.rawValue.cString(using: .utf8), stream.ctx)
+    return MLXArray(result)
+}
+
+/// Returns a partitioned copy of the array such that the smaller `kth`
+/// elements are first.
+///
+/// The ordering of the elements within each partition is undefined.
+///
+/// - Parameters:
+///     - array: input array
+///     - kth: Element at the `kth` index will be in its sorted
+///                   position in the output. All elements before the kth index will
+///                   be less or equal to the `kth` element and all elements after
+///                   will be greater or equal to the `kth` element in the output.
+///     - axis: axis to partition over
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:sorting>
+/// - ``partitioned(_:kth:stream:)``
+/// - ``argPartition(_:kth:axis:stream:)``
+public func partitioned(_ array: MLXArray, kth: Int, axis: Int, stream: StreamOrDevice = .default)
+    -> MLXArray
+{
+    var out = mlx_array_new()
+    mlx_partition_axis(&out, array.ctx, kth.int32, axis.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Returns a partitioned copy of the flattened array such that the smaller `kth`
+/// elements are first.
+///
+/// The ordering of the elements within each partition is undefined.
+///
+/// - Parameters:
+///     - array: input array
+///     - kth: Element at the `kth` index will be in its sorted
+///                   position in the output. All elements before the kth index will
+///                   be less or equal to the `kth` element and all elements after
+///                   will be greater or equal to the `kth` element in the output.
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:sorting>
+/// - ``partitioned(_:kth:axis:stream:)``
+/// - ``argPartition(_:kth:axis:stream:)``
+public func partitioned(_ array: MLXArray, kth: Int, stream: StreamOrDevice = .default) -> MLXArray
+{
+    var out = mlx_array_new()
+    mlx_partition(&out, array.ctx, kth.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Put values along an axis at the specified indices.
+///
+/// - Parameters:
+///     - array: destination array
+///     - indices: Indices array. These should be broadcastable with the input array excluding the `axis` dimension.
+///     - values: Values array. These should be broadcastable with the indices.
+///     - axis: Axis in the destination to put the values to
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:indexes>
+/// - ``takeAlong(_:_:stream:)``
+public func putAlong(
+    _ array: MLXArray, _ indices: MLXArray, values: MLXArray, axis: Int,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_put_along_axis(&out, array.ctx, indices.ctx, values.ctx, axis.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Put values at the specified indices of the flattened array.
+///
+/// The array is reshaped to 1-D, updated along axis `0`, and the result is reshaped back
+/// to the shape of `array`.
+///
+/// - Parameters:
+///     - array: destination array
+///     - indices: Indices array. These should be broadcastable with the flattened input array
+///     - values: Values array. These should be broadcastable with the flattened input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:indexes>
+/// - ``takeAlong(_:_:axis:stream:)``
+public func putAlong(
+    _ array: MLXArray, _ indices: MLXArray, values: MLXArray, stream: StreamOrDevice = .default
+)
+    -> MLXArray
+{
+    let flattened = array.reshaped([-1], stream: stream)
+
+    var out = mlx_array_new()
+    mlx_put_along_axis(&out, flattened.ctx, indices.ctx, values.ctx, 0, stream.ctx)
+
+    // Restore the caller's original shape.
+    let updated = MLXArray(out)
+    return updated.reshaped(array.shape, stream: stream)
+}
+
+/// Quantize the matrix `w` using `bits` bits per element.
+///
+/// Note, every `group_size` elements in a row of `w` are quantized
+/// together. Hence, number of columns of `w` should be divisible by
+/// `group_size`. In particular, the rows of `w` are divided into groups of
+/// size `group_size` which are quantized together.
+///
+/// > `quantized` currently only supports 2D inputs with dimensions which are multiples of 32
+///
+/// - Parameters:
+///   - w: Matrix to be quantized
+///   - groupSize: The size of the group in `w` that shares a scale and bias. When `nil`, the
+///     group size carried by `.affine(groupSize:bits:)` is used; for any other `mode` the choice
+///     is left to MLX.
+///   - bits: The number of bits occupied by each element of `w` in the returned quantized matrix.
+///     When `nil`, the bits carried by `.affine(groupSize:bits:)` are used; for any other `mode`
+///     the choice is left to MLX.
+///   - mode: The quantization mode. Default is `.affine()`
+///   - globalScale: The per-input float32 scale used for  ``QuantizationMode/nvfp4``
+///   - stream: Stream or device to evaluate on
+/// - Returns: A tuple containing the quantized weights (`wq`), scaling factors (`scales`), and bias values (`biases`).
+///     Note that `biases` may be nil for some `mode`.
+///
+/// For details, please see
+/// [this documentation](https://ml-explore.github.io/mlx/build/html/python/_autosummary/mlx.core.quantize.html)
+///
+/// ### See Also
+/// - ``dequantized(_:scales:biases:groupSize:bits:mode:globalScale:dtype:stream:)``
+/// - ``quantizedMM(_:_:scales:biases:transpose:groupSize:bits:mode:stream:)``
+public func quantized(
+    _ w: MLXArray,
+    groupSize: Int? = nil, bits: Int? = nil,
+    mode: QuantizationMode = .affine(),
+    globalScale: MLXArray? = nil,
+    stream: StreamOrDevice = .default
+) -> (wq: MLXArray, scales: MLXArray, biases: MLXArray?) {
+    var r = mlx_vector_array_new()
+    defer { mlx_vector_array_free(r) }
+
+    // Explicit arguments take precedence; otherwise honor the values carried by `.affine`
+    // instead of silently dropping them.
+    var resolvedGroupSize = groupSize
+    var resolvedBits = bits
+    if case .affine(let modeGroupSize, let modeBits) = mode {
+        resolvedGroupSize = resolvedGroupSize ?? modeGroupSize
+        resolvedBits = resolvedBits ?? modeBits
+    }
+
+    let gs = mlx_optional_int(
+        value: Int32(resolvedGroupSize ?? 0), has_value: resolvedGroupSize != nil)
+    let optionalBits = mlx_optional_int(
+        value: Int32(resolvedBits ?? 0), has_value: resolvedBits != nil)
+
+    mlx_quantize(
+        &r, w.ctx, gs, optionalBits, mode.cName,
+        (globalScale ?? .mlxNone).ctx,
+        stream.ctx)
+
+    // The third entry (biases) is only present when the result holds more than two arrays.
+    let arrays = mlx_vector_array_values(r)
+    return (arrays[0], arrays[1], arrays.count > 2 ? arrays[2] : nil)
+}
+
+@available(
+    *, deprecated, renamed: "quantizedMM(_:_:scales:biases:transpose:groupSize:bits:mode:stream:)"
+)
+public func quantizedMatmul(
+    _ x: MLXArray, _ w: MLXArray, scales: MLXArray, biases: MLXArray?,
+    transpose: Bool = true,
+    groupSize: Int? = nil, bits: Int? = nil,
+    mode: QuantizationMode = .affine(),
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    // Deprecated spelling: every argument is forwarded unchanged to `quantizedMM`.
+    return quantizedMM(
+        x, w,
+        scales: scales,
+        biases: biases,
+        transpose: transpose,
+        groupSize: groupSize,
+        bits: bits,
+        mode: mode,
+        stream: stream
+    )
+}
+
+/// Perform the matrix multiplication with the quantized matrix `w`. The
+/// quantization uses one floating point scale and bias per `group_size` of
+/// elements. Each element in `w` takes `bits` bits and is packed in an
+/// unsigned 32 bit integer.
+///
+/// - Parameters:
+///   - x: Input array
+///   - w: Quantized matrix packed in unsigned integers
+///   - scales: The scales to use per `groupSize` elements of `w`
+///   - biases: The biases to use per `groupSize` elements of `w`
+///   - transpose: Defines whether to multiply with the transposed `w` or not,
+///     namely whether we are performing `x @ w.T` or `x @ w`. Default is `true`
+///   - groupSize: The size of the group in `w` that shares a scale and bias. When `nil`, the
+///     group size carried by `.affine(groupSize:bits:)` is used; for any other `mode` the choice
+///     is left to MLX.
+///   - bits: The number of bits occupied by each element in `w`. When `nil`, the bits carried
+///     by `.affine(groupSize:bits:)` are used; for any other `mode` the choice is left to MLX.
+///   - mode: The quantization mode. Default is `.affine()`
+///   - stream: Stream or device to evaluate on
+///
+/// ### See Also
+/// - ``dequantized(_:scales:biases:groupSize:bits:mode:globalScale:dtype:stream:)``
+/// - ``quantized(_:groupSize:bits:mode:globalScale:stream:)``
+public func quantizedMM(
+    _ x: MLXArray, _ w: MLXArray, scales: MLXArray, biases: MLXArray?,
+    transpose: Bool = true,
+    groupSize: Int? = nil, bits: Int? = nil,
+    mode: QuantizationMode = .affine(),
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var result = mlx_array_new()
+
+    // Explicit arguments take precedence; otherwise honor the values carried by `.affine`
+    // instead of silently dropping them.
+    var resolvedGroupSize = groupSize
+    var resolvedBits = bits
+    if case .affine(let modeGroupSize, let modeBits) = mode {
+        resolvedGroupSize = resolvedGroupSize ?? modeGroupSize
+        resolvedBits = resolvedBits ?? modeBits
+    }
+
+    let gs = mlx_optional_int(
+        value: Int32(resolvedGroupSize ?? 0), has_value: resolvedGroupSize != nil)
+    let optionalBits = mlx_optional_int(
+        value: Int32(resolvedBits ?? 0), has_value: resolvedBits != nil)
+
+    mlx_quantized_matmul(
+        &result,
+        x.ctx, w.ctx, scales.ctx, (biases ?? .mlxNone).ctx,
+        transpose, gs, optionalBits,
+        mode.cName,
+        stream.ctx
+    )
+    return MLXArray(result)
+}
+
+/// Perform a matrix multiplication using a possibly quantized weight matrix
+/// `w` and a non-quantized input `x`. The input `x` is quantized on the
+/// fly. The weight matrix `w` is used as-is if it is already quantized;
+/// otherwise, it is quantized on the fly.
+///
+/// If `w` is quantized, `scales` must be provided, and `groupSize`,
+/// `bits`, and `mode` must match the parameters that were used to quantize
+/// `w`.
+///
+/// Notes:
+/// - If `w` is expected to receive gradients, it must be provided in
+///   non-quantized form.
+///
+/// - If `x` and `w` are not quantized, their data types must be ``DType/float32``,
+///   ``DType/float16``, or ``DType/bfloat16``.
+///
+/// - If `w` is quantized, it must be packed in unsigned integers.
+///
+/// - Parameters:
+///   - x: input array
+///   - w: weight matrix.  If quantized, it is packed in unsigned integers.
+///   - scales: The scales to use per `groupSize` elements of `w` if `w` is quantized
+///   - groupSize: Number of elements in `x` and `w` that share a scale
+///   - bits: Number of bits used to represent each element of `x` and `w`
+///   - mode: The quantization mode. Default is `.nvfp4`
+///   - globalScaleX: The per-input float32 scale used for `x` with  ``QuantizationMode/nvfp4``
+///   - globalScaleW: The per-input float32 scale used for  `w` with ``QuantizationMode/nvfp4``
+///   - stream: Stream or device to evaluate on
+public func quantizedQuantizedMM(
+    _ x: MLXArray, _ w: MLXArray, scales: MLXArray?,
+    groupSize: Int? = nil, bits: Int? = nil,
+    mode: QuantizationMode = .nvfp4,
+    globalScaleX: MLXArray? = nil,
+    globalScaleW: MLXArray? = nil,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    // `nil` sizes are forwarded as empty optionals (`has_value == false`).
+    let optionalGroupSize = mlx_optional_int(
+        value: Int32(groupSize ?? 0), has_value: groupSize != nil)
+    let optionalBits = mlx_optional_int(value: Int32(bits ?? 0), has_value: bits != nil)
+
+    // Missing optional arrays are replaced by the `.mlxNone` placeholder.
+    let scalesArray = scales ?? .mlxNone
+    let scaleX = globalScaleX ?? .mlxNone
+    let scaleW = globalScaleW ?? .mlxNone
+
+    var out = mlx_array_new()
+    mlx_qqmm(
+        &out,
+        x.ctx, w.ctx, scalesArray.ctx,
+        optionalGroupSize, optionalBits,
+        mode.cName,
+        scaleX.ctx,
+        scaleW.ctx,
+        stream.ctx
+    )
+    return MLXArray(out)
+}
+
+/// Convert angles from degrees to radians.
+///
+/// - Parameters:
+///   - array: input array, in degrees
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``degrees(_:stream:)``
+public func radians(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_radians(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise remainder of division.
+///
+/// Computes the remainder of dividing `a` by `b` with <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+///
+/// let r = remainder(a, 2) // e.g. a % 2
+/// ```
+///
+/// - Parameters:
+///     - a: the left hand side operand
+///     - b: the right hand side operand
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func remainder(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    // Run both operands through `toArrays` so each one exposes a `ctx` handle.
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_remainder(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Roll array elements along a given axis.
+///
+/// Elements that are rolled beyond the end of the array are introduced at the beginning and vice-versa.
+///
+/// - Parameters:
+///   - a: input array
+///   - shift: The number of places by which elements
+///     are shifted. If positive the array is rolled to the right, if
+///     negative it is rolled to the left.
+///   - axis: the axis along which to roll the elements
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:shapes>
+public func roll(_ a: MLXArray, shift: Int, axis: Int, stream: StreamOrDevice = .default)
+    -> MLXArray
+{
+    // The C API takes a list of shifts; this overload always supplies exactly one.
+    let shifts = [shift.int32]
+    var out = mlx_array_new()
+    mlx_roll_axis(&out, a.ctx, shifts, 1, axis.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Roll array elements along the given axes.
+///
+/// Elements that are rolled beyond the end of the array are introduced at the beginning and vice-versa.
+///
+/// - Parameters:
+///   - a: input array
+///   - shift: The number of places by which elements
+///     are shifted. If positive the array is rolled to the right, if
+///     negative it is rolled to the left.
+///   - axes: the axes along which to roll the elements, or all if omitted
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:shapes>
+public func roll(
+    _ a: MLXArray, shift: Int, axes: (some Collection<Int>)? = [Int]?.none,
+    stream: StreamOrDevice = .default
+)
+    -> MLXArray
+{
+    // The C API takes a list of shifts; this overload always supplies exactly one.
+    let shifts = [shift.int32]
+    var out = mlx_array_new()
+
+    // Without explicit axes, use the axis-free entry point.
+    guard let axes else {
+        mlx_roll(&out, a.ctx, shifts, 1, stream.ctx)
+        return MLXArray(out)
+    }
+
+    mlx_roll_axes(&out, a.ctx, shifts, 1, axes.asInt32, axes.count, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise logistic sigmoid.
+///
+/// For details, please see
+/// [this documentation](https://ml-explore.github.io/mlx/build/html/python/_autosummary/mlx.core.sigmoid.html)
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func sigmoid(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_sigmoid(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise sign.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func sign(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_sign(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise hyperbolic sine.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``sin(_:stream:)``
+public func sinh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_sinh(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+@available(*, deprecated, renamed: "softmax(_:axes:precise:stream:)")
+@_documentation(visibility: internal)
+public func softMax(
+    _ array: MLXArray, axes: some Collection<Int>, precise: Bool = false,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    // Deprecated spelling: forwards to the lower-case `softmax`.
+    return softmax(array, axes: axes, precise: precise, stream: stream)
+}
+
+/// Perform the softmax over the given axes.
+///
+/// This operation is a numerically stable version of:
+///
+/// ```swift
+/// exp(a) / sum(exp(a), axis, keepdims: true)
+/// ```
+///
+/// - Parameters:
+///     - array: input array
+///     - axes: axes to compute the softmax over
+///     - precise: if true, compute a more precise softmax by scaling the input
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``softmax(_:axis:precise:stream:)``
+/// - ``softmax(_:precise:stream:)``
+public func softmax(
+    _ array: MLXArray, axes: some Collection<Int>, precise: Bool = false,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_softmax_axes(&out, array.ctx, axes.asInt32, axes.count, precise, stream.ctx)
+    return MLXArray(out)
+}
+
+@available(*, deprecated, renamed: "softmax(_:axis:precise:stream:)")
+@_documentation(visibility: internal)
+public func softMax(
+    _ array: MLXArray, axis: Int, precise: Bool = false, stream: StreamOrDevice = .default
+) -> MLXArray {
+    // Deprecated spelling: forwards to the lower-case `softmax`.
+    return softmax(array, axis: axis, precise: precise, stream: stream)
+}
+
+/// Perform the softmax along the given axis.
+///
+/// This operation is a numerically stable version of:
+///
+/// ```swift
+/// exp(a) / sum(exp(a), axis, keepdims: true)
+/// ```
+///
+/// - Parameters:
+///     - array: input array
+///     - axis: axis to compute the softmax over
+///     - precise: if true, compute a more precise softmax by scaling the input
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``softmax(_:axes:precise:stream:)``
+/// - ``softmax(_:precise:stream:)``
+public func softmax(
+    _ array: MLXArray, axis: Int, precise: Bool = false, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_softmax_axis(&out, array.ctx, axis.int32, precise, stream.ctx)
+    return MLXArray(out)
+}
+
+// Deprecated spelling of `softmax(_:precise:stream:)`. The `renamed:` target must name the
+// overload without an `axis` label, since that is the function this one forwards to.
+@available(*, deprecated, renamed: "softmax(_:precise:stream:)")
+@_documentation(visibility: internal)
+public func softMax(_ array: MLXArray, precise: Bool = false, stream: StreamOrDevice = .default)
+    -> MLXArray
+{
+    softmax(array, precise: precise, stream: stream)
+}
+
+/// Perform the softmax of the array without specifying an axis.
+///
+/// This operation is a numerically stable version of:
+///
+/// ```swift
+/// exp(a) / sum(exp(a), axis, keepdims: true)
+/// ```
+///
+/// - Parameters:
+///     - array: input array
+///     - precise: if true, compute a more precise softmax by scaling the input
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - ``softmax(_:axes:precise:stream:)``
+/// - ``softmax(_:axis:precise:stream:)``
+public func softmax(_ array: MLXArray, precise: Bool = false, stream: StreamOrDevice = .default)
+    -> MLXArray
+{
+    var out = mlx_array_new()
+    mlx_softmax(&out, array.ctx, precise, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Returns a copy of the array sorted along an axis.
+///
+/// - Parameters:
+///     - array: input array
+///     - axis: axis to sort over
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:sorting>
+/// - ``sorted(_:stream:)``
+/// - ``argSort(_:axis:stream:)``
+public func sorted(_ array: MLXArray, axis: Int, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_sort_axis(&out, array.ctx, axis.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Returns a sorted copy of the flattened array.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:sorting>
+/// - ``sorted(_:axis:stream:)``
+/// - ``argSort(_:axis:stream:)``
+public func sorted(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_sort(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Compute the standard deviation(s) over the given axes.
+///
+/// - Parameters:
+///   - array: input array
+///   - axes: axes to reduce over
+///   - keepDims: if `true` keep reduced axis as singleton dimension
+///   - ddof: the divisor used to compute the variance is `N - ddof`
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:reduction>
+/// - ``std(_:axis:keepDims:ddof:stream:)``
+/// - ``std(_:keepDims:ddof:stream:)``
+public func std(
+    _ array: MLXArray, axes: some Collection<Int>, keepDims: Bool = false, ddof: Int = 0,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_std_axes(&out, array.ctx, axes.asInt32, axes.count, keepDims, ddof.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Compute the standard deviation over the given axis.
+///
+/// - Parameters:
+///   - array: input array
+///   - axis: axis to reduce over
+///   - keepDims: if `true` keep reduced axis as singleton dimension
+///   - ddof: the divisor used to compute the variance is `N - ddof`
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:reduction>
+/// - ``std(_:axes:keepDims:ddof:stream:)``
+/// - ``std(_:keepDims:ddof:stream:)``
+public func std(
+    _ array: MLXArray, axis: Int, keepDims: Bool = false, ddof: Int = 0,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_std_axis(&out, array.ctx, axis.int32, keepDims, ddof.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Compute the standard deviation over all axes.
+///
+/// - Parameters:
+///   - array: input array
+///   - keepDims: if `true` keep reduced axis as singleton dimension
+///   - ddof: the divisor used to compute the variance is `N - ddof`
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:reduction>
+/// - ``std(_:axes:keepDims:ddof:stream:)``
+/// - ``std(_:axis:keepDims:ddof:stream:)``
+public func std(
+    _ array: MLXArray, keepDims: Bool = false, ddof: Int = 0, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_std(&out, array.ctx, keepDims, ddof.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Stacks the arrays along a new axis.
+///
+/// - Parameters:
+///   - arrays: the arrays to stack
+///   - axis: position of the new axis. Default is `0`
+///   - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:shapes>
+public func stacked(
+    _ arrays: some Collection<MLXArray>, axis: Int = 0, stream: StreamOrDevice = .default
+)
+    -> MLXArray
+{
+    // The temporary C vector is freed on every exit path.
+    let inputs = new_mlx_vector_array(arrays)
+    defer { mlx_vector_array_free(inputs) }
+
+    var out = mlx_array_new()
+    mlx_stack_axis(&out, inputs, axis.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Stop gradients from being computed.
+///
+/// The operation is the identity but it prevents gradients from flowing
+/// through the array.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+public func stopGradient(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_stop_gradient(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise subtraction.
+///
+/// Computes the difference of two operands with <doc:broadcasting>.
+///
+/// For example:
+///
+/// ```swift
+/// let a = MLXArray(0 ..< 12, [4, 3])
+/// let b = MLXArray([4, 5, 6])
+///
+/// let r = subtract(a, b) // e.g. a - b
+/// ```
+///
+/// - Parameters:
+///     - a: the left hand side operand
+///     - b: the right hand side operand
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func subtract(
+    _ a: some ScalarOrArray, _ b: some ScalarOrArray, stream: StreamOrDevice = .default
+) -> MLXArray {
+    // Run both operands through `toArrays` so each one exposes a `ctx` handle.
+    let (lhs, rhs) = toArrays(a, b)
+    var out = mlx_array_new()
+    mlx_subtract(&out, lhs.ctx, rhs.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Take values along an axis at the specified indices.
+///
+/// - Parameters:
+///     - array: the array to take values from
+///     - indices: should be broadcastable to `array` excluding the `axis` dimension
+///     - axis: axis in the input to take the values from
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:indexes>
+/// - ``takeAlong(_:_:stream:)``
+public func takeAlong(
+    _ array: MLXArray, _ indices: MLXArray, axis: Int, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_take_along_axis(&out, array.ctx, indices.ctx, axis.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Take values at the specified indices from the flattened array.
+///
+/// The array is reshaped to 1-D and values are taken along axis `0`.
+///
+/// - Parameters:
+///     - array: the array to take values from
+///     - indices: should be broadcastable to the flattened `array`
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:indexes>
+/// - ``takeAlong(_:_:axis:stream:)``
+public func takeAlong(_ array: MLXArray, _ indices: MLXArray, stream: StreamOrDevice = .default)
+    -> MLXArray
+{
+    let flattened = array.reshaped([-1], stream: stream)
+
+    var out = mlx_array_new()
+    mlx_take_along_axis(&out, flattened.ctx, indices.ctx, 0, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise tangent.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func tan(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_tan(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Element-wise hyperbolic tangent.
+///
+/// - Parameters:
+///     - array: input array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func tanh(_ array: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_tanh(&out, array.ctx, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Compute tensor dot product.
+///
+/// - Parameters:
+///   - a: first input array
+///   - b: second input array
+///   - axes: sum over the last `axes` dimensions. Default is `1`
+///   - stream: stream or device to evaluate on
+/// - Returns: tensor dot product
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``tensordot(_:_:axes:stream:)-(MLXArray,MLXArray,Int,StreamOrDevice)``
+public func tensordot(
+    _ a: MLXArray, _ b: MLXArray, axes: Int = 1, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var out = mlx_array_new()
+    mlx_tensordot_axis(&out, a.ctx, b.ctx, axes.int32, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Compute tensor dot product.
+///
+/// - Parameters:
+///   - a: first input array
+///   - b: second input array
+///   - axes: two ranges for the `a` and `b` dimensions
+///   - stream: stream or device to evaluate on
+/// - Returns: tensor dot product
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``tensordot(_:_:axes:stream:)-(MLXArray,MLXArray,((Int,Int),(Int,Int)),StreamOrDevice)``
+public func tensordot(
+    _ a: MLXArray, _ b: MLXArray, axes: ((Int, Int), (Int, Int)), stream: StreamOrDevice = .default
+) -> MLXArray {
+    // Each pair becomes a two-element axis list: `axes.0` for `a`, `axes.1` for `b`.
+    let (aPair, bPair) = axes
+    let aAxes = [aPair.0, aPair.1].asInt32
+    let bAxes = [bPair.0, bPair.1].asInt32
+
+    var out = mlx_array_new()
+    mlx_tensordot(&out, a.ctx, b.ctx, aAxes, 2, bAxes, 2, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Compute tensor dot product.
+///
+/// - Parameters:
+///   - a: first input array
+///   - b: second input array
+///   - axes: multiple ranges for the `a` and `b` dimensions
+///   - stream: stream or device to evaluate on
+/// - Returns: tensor dot product
+///
+/// ### See Also
+/// - <doc:arithmetic>
+/// - ``tensordot(_:_:axes:stream:)``
+public func tensordot(
+    _ a: MLXArray, _ b: MLXArray, axes: (some Collection<Int>, some Collection<Int>),
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    // `axes.0` lists the axes of `a`, `axes.1` the axes of `b`.
+    let (aAxes, bAxes) = axes
+
+    var out = mlx_array_new()
+    mlx_tensordot(
+        &out,
+        a.ctx, b.ctx,
+        aAxes.asInt32, aAxes.count,
+        bAxes.asInt32, bAxes.count,
+        stream.ctx)
+    return MLXArray(out)
+}
+
+/// Construct an array by repeating the given array the number of times given by `repetitions`.
+///
+/// - Parameters:
+///   - array: input array
+///   - repetitions: number of repetitions for each axis
+///   - stream: stream or device to evaluate on
+/// - Returns: tiled array
+///
+/// ### See Also
+/// - <doc:shapes>
+/// - ``tiled(_:repetitions:stream:)-eouf``
+public func tiled(
+    _ array: MLXArray, repetitions: some Collection<Int>, stream: StreamOrDevice = .default
+)
+    -> MLXArray
+{
+    var out = mlx_array_new()
+    mlx_tile(&out, array.ctx, repetitions.asInt32, repetitions.count, stream.ctx)
+    return MLXArray(out)
+}
+
+/// Build a new array by tiling `array` with a single repetition count.
+///
+/// - Parameters:
+///   - array: input array
+///   - repetitions: repetition count, forwarded as a one-element repetition list
+///   - stream: stream or device to evaluate on
+/// - Returns: tiled array
+///
+/// ### See Also
+/// - <doc:shapes>
+/// - ``tiled(_:repetitions:stream:)-(MLXArray,Int,StreamOrDevice)``
+public func tiled(
+    _ array: MLXArray, repetitions: Int, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_tile(&output, array.ctx, [repetitions.int32], 1, stream.ctx)
+    return MLXArray(output)
+}
+
+/// Select the `k` largest elements of `array` along `axis`.
+///
+/// The selected elements are not guaranteed to come back in sorted order.
+///
+/// - Parameters:
+///     - array: input array
+///     - k: number of values to select
+///     - axis: axis to select over
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:sorting>
+/// - ``top(_:k:stream:)``
+public func top(
+    _ array: MLXArray, k: Int, axis: Int = -1, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_topk_axis(&output, array.ctx, k.int32, axis.int32, stream.ctx)
+    return MLXArray(output)
+}
+
+/// Select the `k` largest elements of the flattened input.
+///
+/// The selected elements are not guaranteed to come back in sorted order.
+///
+/// - Parameters:
+///     - array: input array
+///     - k: number of values to select
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:sorting>
+/// - ``top(_:k:axis:stream:)``
+public func top(_ array: MLXArray, k: Int, stream: StreamOrDevice = .default) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_topk(&output, array.ctx, k.int32, stream.ctx)
+    return MLXArray(output)
+}
+
+/// Sum the elements on a chosen diagonal of `array`.
+///
+/// - Parameters:
+///   - array: input array
+///   - offset: offset of the diagonal relative to the main diagonal
+///   - axis1: first axis of the 2-D sub-arrays the diagonals are taken from
+///   - axis2: second axis of the 2-D sub-arrays the diagonals are taken from
+///   - dtype: data type of the output array; when `nil` the dtype of `array` is used
+///   - stream: stream or device to evaluate on
+/// - Returns: sum of the specified diagonal
+///
+/// ### See Also
+/// - <doc:arithmetic>
+public func trace(
+    _ array: MLXArray, offset: Int = 0, axis1: Int = 0, axis2: Int = 1, dtype: DType? = nil,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    let outputType = dtype ?? array.dtype
+    var output = mlx_array_new()
+    mlx_trace(
+        &output, array.ctx, offset.int32, axis1.int32, axis2.int32, outputType.cmlxDtype,
+        stream.ctx)
+    return MLXArray(output)
+}
+
+/// Zero out the entries of `array` that lie above diagonal `k`.
+///
+/// - Parameters:
+///     - array: input array
+///     - k: the diagonal of the 2-D array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - ``triu(_:k:stream:)``
+public func tril(_ array: MLXArray, k: Int = 0, stream: StreamOrDevice = .default) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_tril(&output, array.ctx, k.int32, stream.ctx)
+    return MLXArray(output)
+}
+
+/// Zero out the entries of `array` that lie below diagonal `k`.
+///
+/// - Parameters:
+///     - array: input array
+///     - k: the diagonal of the 2-D array
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - ``tril(_:k:stream:)``
+public func triu(_ array: MLXArray, k: Int = 0, stream: StreamOrDevice = .default) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_triu(&output, array.ctx, k.int32, stream.ctx)
+    return MLXArray(output)
+}
+
+/// Choose elements from `a` or `b` according to `condition`.
+///
+/// The condition and the two inputs must have the same shape or be compatible
+/// with one another under <doc:broadcasting>.
+///
+/// > ``which(_:_:_:stream:)`` may be easier to use (`where` is a Swift keyword).
+///
+/// - Parameters:
+///     - condition: condition array
+///     - a: values selected where `condition` is non-zero or `true`
+///     - b: values selected where `condition` is zero or `false`
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:logical>
+/// - ``which(_:_:_:stream:)``
+public func `where`(
+    _ condition: MLXArray, _ a: some ScalarOrArray, _ b: some ScalarOrArray,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (whenTrue, whenFalse) = toArrays(a, b)
+    var output = mlx_array_new()
+    mlx_where(&output, condition.ctx, whenTrue.ctx, whenFalse.ctx, stream.ctx)
+    return MLXArray(output)
+}
+
+/// Alias for ``where(_:_:_:stream:)`` -- choose elements from `a` or `b` according to `condition`.
+///
+/// The condition and the two inputs must have the same shape or be compatible
+/// with one another under <doc:broadcasting>.
+///
+/// - Parameters:
+///     - condition: condition array
+///     - a: values selected where `condition` is non-zero or `true`
+///     - b: values selected where `condition` is zero or `false`
+///     - stream: stream or device to evaluate on
+///
+/// ### See Also
+/// - <doc:logical>
+/// - ``where(_:_:_:stream:)``
+public func which(
+    _ condition: MLXArray, _ a: some ScalarOrArray, _ b: some ScalarOrArray,
+    stream: StreamOrDevice = .default
+) -> MLXArray {
+    let (ifTrue, ifFalse) = toArrays(a, b)
+    var selection = mlx_array_new()
+    mlx_where(&selection, condition.ctx, ifTrue.ctx, ifFalse.ctx, stream.ctx)
+    return MLXArray(selection)
+}
+
+/// Kronecker product of the arrays `a` and `b`.
+///
+/// - Parameters:
+///     - a: first input array
+///     - b: second input array
+///     - stream: stream or device to evaluate on
+/// - Returns: the Kronecker product as a new array
+public func kron(_ a: MLXArray, _ b: MLXArray, stream: StreamOrDevice = .default) -> MLXArray {
+    // the C call writes its output through the `&product` pointer
+    var product = mlx_array_new()
+    mlx_kron(&product, a.ctx, b.ctx, stream.ctx)
+    return MLXArray(product)
+}
+
+/// Flatten a range of axes of an array.
+///
+/// Every axis from `startAxis` through `endAxis`, inclusive, is flattened.
+/// Negative axes are supported. Once negative axes have been converted to
+/// positive ones, values outside the valid range are clamped: `startAxis`
+/// to `0` and `endAxis` to `ndim - 1`.
+///
+/// - Parameters:
+///     - a: input array
+///     - startAxis: first dimension to flatten
+///     - endAxis: last dimension to flatten
+///     - stream: stream or device to evaluate on
+public func flatten(
+    _ a: MLXArray, startAxis: Int, endAxis: Int = -1, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_flatten(&output, a.ctx, startAxis.int32, endAxis.int32, stream.ctx)
+    return MLXArray(output)
+}
+
+/// Expand a single axis of an array into the given shape.
+///
+/// - Parameters:
+///     - a: input array
+///     - axis: the axis to unflatten
+///     - shape: the shape that `axis` is unflattened into
+///     - stream: stream or device to evaluate on
+public func unflatten(
+    _ a: MLXArray, axis: Int, shape: some Collection<Int>, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_unflatten(&output, a.ctx, axis.int32, shape.map { Int32($0) }, shape.count, stream.ctx)
+    return MLXArray(output)
+}
+
+/// Make an array row contiguous, copying it if necessary.
+///
+/// - Parameters:
+///   - a: input array
+///   - allowColMajor: also treat column major layout as contiguous and do not copy it
+///   - stream: stream or device to evaluate on
+/// - Returns: the row or column contiguous output
+public func contiguous(
+    _ a: MLXArray, allowColMajor: Bool = false, stream: StreamOrDevice = .default
+) -> MLXArray {
+    var output = mlx_array_new()
+    mlx_contiguous(&output, a.ctx, allowColMajor, stream.ctx)
+    return MLXArray(output)
+}