Fix #231: use Embedding.asLinear instead of a manual matmul against the transposed embedding weights (#232)

davidkoski · web-flow · commit f35df96f0c66 · 2025-03-10T10:35:39.000-07:00
diff --git a/Libraries/MLXLLM/Models/Cohere.swift b/Libraries/MLXLLM/Models/Cohere.swift
@@ -163,7 +163,7 @@ public class CohereModel: Module, LLMModel, KVCacheDimensionProvider {
 
     public func callAsFunction(_ inputs: MLXArray, cache: [KVCache]?) -> MLXArray {
         var out = model(inputs, cache: cache)
-        out = matmul(out, model.embedTokens.weight.T)
+        out = model.embedTokens.asLinear(out)
         out = out * self.logitScale
         return out
     }
diff --git a/Libraries/MLXLLM/Models/OpenELM.swift b/Libraries/MLXLLM/Models/OpenELM.swift
@@ -199,7 +199,7 @@ public class OpenELMModel: Module, LLMModel, KVCacheDimensionProvider {
         if let lmHead {
             out = lmHead(out)
         } else {
-            out = matmul(out, transformer.embedTokens.weight.T)
+            out = transformer.embedTokens.asLinear(out)
         }
 
         return out
diff --git a/Libraries/MLXLLM/Models/Starcoder2.swift b/Libraries/MLXLLM/Models/Starcoder2.swift
@@ -173,7 +173,7 @@ public class Starcoder2Model: Module, LLMModel, KVCacheDimensionProvider {
         if !tieWordEmbeddings {
             return lmHead(out)
         } else {
-            out = matmul(out, model.embedTokens.weight.T)
+            out = model.embedTokens.asLinear(out)
             return out
         }
     }

Original file line number	Diff line number	Diff line change
`@@ -163,7 +163,7 @@ public class CohereModel: Module, LLMModel, KVCacheDimensionProvider {`
`163`	`163`
`164`	`164`	`public func callAsFunction(_ inputs: MLXArray, cache: [KVCache]?) -> MLXArray {`
`165`	`165`	`var out = model(inputs, cache: cache)`
`166`		`- out = matmul(out, model.embedTokens.weight.T)`
	`166`	`+ out = model.embedTokens.asLinear(out)`
`167`	`167`	`out = out * self.logitScale`
`168`	`168`	`return out`
`169`	`169`	`}`
Original file line number	Diff line number	Diff line change
`@@ -199,7 +199,7 @@ public class OpenELMModel: Module, LLMModel, KVCacheDimensionProvider {`
`199`	`199`	`if let lmHead {`
`200`	`200`	`out = lmHead(out)`
`201`	`201`	`} else {`
`202`		`- out = matmul(out, transformer.embedTokens.weight.T)`
	`202`	`+ out = transformer.embedTokens.asLinear(out)`
`203`	`203`	`}`
`204`	`204`
`205`	`205`	`return out`
Original file line number	Diff line number	Diff line change
`@@ -173,7 +173,7 @@ public class Starcoder2Model: Module, LLMModel, KVCacheDimensionProvider {`
`173`	`173`	`if !tieWordEmbeddings {`
`174`	`174`	`return lmHead(out)`
`175`	`175`	`} else {`
`176`		`- out = matmul(out, model.embedTokens.weight.T)`
	`176`	`+ out = model.embedTokens.asLinear(out)`
`177`	`177`	`return out`
`178`	`178`	`}`
`179`	`179`	`}`