Use fast (#38)

* update to latest mlx swift and use fast norms
* gpu usage -> memory usage
commit 15b38cd146 (parent 3314e20a24)
Author: Awni Hannun
Date:   2024-03-27 16:37:35 -07:00
Committed by: GitHub

4 changed files with 5 additions and 17 deletions

@@ -85,7 +85,7 @@ struct ContentView: View {
 .toolbar {
     ToolbarItem {
         Label(
-            "GPU Usage: \(deviceStat.gpuUsage.activeMemory.formatted(.byteCount(style: .memory)))",
+            "Memory Usage: \(deviceStat.gpuUsage.activeMemory.formatted(.byteCount(style: .memory)))",
             systemImage: "info.circle.fill"
         )
         .labelStyle(.titleAndIcon)
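
The new title matches what the value actually measures: `deviceStat.gpuUsage.activeMemory` is a byte count of active memory, not a GPU-utilization percentage. A small sketch of the same Foundation formatting call, using a stand-in `Int64` value rather than the app's `deviceStat` property:

```swift
import Foundation

// activeMemory is an illustrative stand-in for deviceStat.gpuUsage.activeMemory.
let activeMemory: Int64 = 1_234_567_890
let title = "Memory Usage: \(activeMemory.formatted(.byteCount(style: .memory)))"
// -> something like "Memory Usage: 1.15 GB"
```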

@@ -9,7 +9,6 @@ import MLXNN
 // specialized norm for gemma
 private class RMSNorm: Module, UnaryLayer {
     let weight: MLXArray
     let eps: Float
@@ -19,13 +18,8 @@ private class RMSNorm: Module, UnaryLayer {
         super.init()
     }
-    func norm(_ x: MLXArray) -> MLXArray {
-        x * rsqrt(x.square().mean(axis: -1, keepDims: true) + eps)
-    }
     public func callAsFunction(_ x: MLXArray) -> MLXArray {
-        let output = norm(x.asType(Float.self)).asType(x.dtype)
-        return (1 + weight) * output
+        return MLXFast.rmsNorm(x, weight: 1.0 + self.weight, eps: self.eps)
     }
 }
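
For reference, a sketch of the two equivalent code paths this hunk swaps. The helper names are made up for illustration, and the `import MLXFast` line is an assumption (depending on the mlx-swift revision, `MLXFast.rmsNorm` may already be reachable through `MLX`):

```swift
import MLX
import MLXFast  // assumed; MLXFast.rmsNorm may already be visible via MLX

// Hand-written path, as removed above: upcast to float32, scale by the
// reciprocal root-mean-square over the last axis, cast back, then apply
// the (1 + weight) gain.
func referenceRMSNorm(_ x: MLXArray, weight: MLXArray, eps: Float) -> MLXArray {
    let xf = x.asType(Float.self)
    let normed = xf * rsqrt(xf.square().mean(axis: -1, keepDims: true) + eps)
    return (1 + weight) * normed.asType(x.dtype)
}

// Replacement used by this commit: a single fused MLXFast kernel.
func fastRMSNorm(_ x: MLXArray, weight: MLXArray, eps: Float) -> MLXArray {
    MLXFast.rmsNorm(x, weight: 1.0 + weight, eps: eps)
}
```

Folding the Gemma-specific `(1 + weight)` gain into the `weight` argument lets the whole normalization run as one kernel call instead of a chain of elementwise ops.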

@@ -7,12 +7,6 @@ import MLXNN
 // https://github.com/ml-explore/mlx-examples/blob/main/llms/mlx_lm/models/phi.py
-private class LayerNorm: MLXNN.LayerNorm {
-    override func callAsFunction(_ x: MLXArray) -> MLXArray {
-        super.callAsFunction(x.asType(Float.self)).asType(x.dtype)
-    }
-}
 private class PhiAttention: Module {
     let args: PhiConfiguration
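
With the float32-upcasting wrapper removed, the stock `MLXNN.LayerNorm` is used directly. A minimal usage sketch, assuming illustrative `dimensions`/`eps` values rather than the real Phi configuration:

```swift
import MLX
import MLXNN

// Plain MLXNN.LayerNorm, as the model now uses; 2560 and 1e-5 are
// placeholder values, not taken from PhiConfiguration.
let layerNorm = LayerNorm(dimensions: 2560, eps: 1e-5)
let x = MLXArray(0 ..< 2560, [1, 1, 2560]).asType(Float.self)
let y = layerNorm(x)  // shape [1, 1, 2560], normalized over the last axis
```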

@@ -1,5 +1,5 @@
 {
-  "originHash" : "73a943caf561dd1482e57053ba01456f25dea3267b2a84a996e42284e17aa6fc",
+  "originHash" : "da53546673b6d05016b6e5640c18814c7dba5b5af8db34715afe6d633037c758",
   "pins" : [
     {
       "identity" : "gzipswift",
@@ -16,7 +16,7 @@
"location" : "https://github.com/ml-explore/mlx-swift",
"state" : {
"branch" : "main",
"revision" : "24e71937e12efe01a0d28a429a703036fae2ff8a"
"revision" : "5e51224ac869366017859dc0b07f6d2dc51b3bae"
}
},
{
@@ -83,5 +83,5 @@
       }
     }
   ],
-  "version" : 2
+  "version" : 3
 }
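
`Package.resolved` only records the outcome of dependency resolution: mlx-swift is tracked by branch rather than by version, so re-resolving picks up the latest `main` revision, and the `version` field is the lockfile-format version written by the resolving toolchain. A sketch of the corresponding manifest declaration, assuming a plain SwiftPM package (the example app actually declares the dependency through its Xcode project):

```swift
// swift-tools-version: 5.9
import PackageDescription

let package = Package(
    name: "ExampleApp",  // placeholder name
    dependencies: [
        // Tracking `main` means Package.resolved pins whichever revision
        // was current at resolution time, which is the change recorded above.
        .package(url: "https://github.com/ml-explore/mlx-swift", branch: "main")
    ]
)
```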