mlx: Remove peak memory from the API

The peak memory metric is still in flux, so for now it is better to just log it rather than expose it through the API.
This commit is contained in:
Jesse Gross
2026-03-02 11:37:52 -08:00
parent c1e3ef4bcc
commit ad16bffc7d
5 changed files with 12 additions and 31 deletions

View File

@@ -558,7 +558,6 @@ func (s *Server) GenerateHandler(c *gin.Context) {
PromptEvalDuration: cr.PromptEvalDuration,
EvalCount: cr.EvalCount,
EvalDuration: cr.EvalDuration,
PeakMemory: cr.PeakMemory,
},
Logprobs: toAPILogprobs(cr.Logprobs),
}
@@ -2317,7 +2316,6 @@ func (s *Server) ChatHandler(c *gin.Context) {
PromptEvalDuration: r.PromptEvalDuration,
EvalCount: r.EvalCount,
EvalDuration: r.EvalDuration,
PeakMemory: r.PeakMemory,
},
Logprobs: toAPILogprobs(r.Logprobs),
}