From 3914f2377933f073785b54b923c0a00d49943e8d Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Wed, 6 May 2026 19:02:14 +0000
Subject: [PATCH 1/3] Initial plan


From 08a452c9e14553b6e15f4b6f36598682fa6428c1 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Wed, 6 May 2026 19:03:56 +0000
Subject: [PATCH 2/3] Fix macOS build: replace float std::from_chars with
 strtof in parse_csv

Agent-Logs-Url: https://github.com/audiohacking/acestep.cpp/sessions/3822a733-dbac-4964-8207-6418ecc203d9

Co-authored-by: lmangani <1423657+lmangani@users.noreply.github.com>
---
 src/pipeline-synth-ops.cpp | 49 ++++++++++++++++++++++++++++----------
 1 file changed, 37 insertions(+), 12 deletions(-)
diff --git a/src/pipeline-synth-ops.cpp b/src/pipeline-synth-ops.cpp
index 7ea93bd..10995d3 100644
--- a/src/pipeline-synth-ops.cpp
+++ b/src/pipeline-synth-ops.cpp
@@ -13,6 +13,7 @@
 #include "vae-enc.h"
 
 #include <charconv>
+#include <cerrno>
 #include <cstdio>
 #include <cstdlib>
 #include <cstring>
@@ -22,22 +23,23 @@
 
 static const int FRAMES_PER_SECOND = 25;
 
-// CSV list parser tolerant to any whitespace around commas. Locale-immune via
-// std::from_chars (C++17 charconv, overloaded on the numeric type). Used for
-// audio_codes (int) and custom_timesteps (float). Bails on first parse error
-// or overflow, returning the values consumed so far.
-template <typename T> static std::vector<T> parse_csv(const std::string & s) {
-    std::vector<T> out;
-    const char *   first = s.data();
-    const char *   last  = first + s.size();
+// CSV list parsers tolerant to spaces around commas. Bail on first parse
+// error or out-of-range value, returning the values consumed so far.
+// Integer variant uses std::from_chars (locale-immune, C++17 charconv).
+// Float variant uses std::strtof (locale-dependent: honours LC_NUMERIC) for
+// portability: Apple Clang lacks floating-point std::from_chars on some SDKs.
+static std::vector<int> parse_csv_int(const std::string & s) {
+    std::vector<int> out;
+    const char *     first = s.data();
+    const char *     last  = first + s.size();
     while (first < last) {
         while (first < last && (*first == ',' || *first == ' ')) {
-            first++;
+            ++first;
         }
         if (first == last) {
             break;
         }
-        T    v{};
+        int  v{};
         auto r = std::from_chars(first, last, v);
         if (r.ec != std::errc{}) {
             break;
@@ -48,6 +50,29 @@ template <typename T> static std::vector<T> parse_csv(const std::string & s) {
     return out;
 }
 
+static std::vector<float> parse_csv_float(const std::string & s) {  // float counterpart of parse_csv_int
+    std::vector<float> out;
+    const char *       first = s.data();
+    const char *       last  = first + s.size();  // one past the final character of s
+    while (first < last) {
+        while (first < last && (*first == ',' || *first == ' ')) {  // skip separators: commas and spaces only
+            ++first;
+        }
+        if (first == last) {  // nothing left but separators
+            break;
+        }
+        char * end = nullptr;
+        errno      = 0;
+        float  v   = std::strtof(first, &end);
+        if (end == first || errno == ERANGE) {
+            break;
+        }
+        out.push_back(v);
+        first = end;  // resume scanning right after the parsed number
+    }
+    return out;  // values parsed before the first failure, or the full list
+}
+
 int ops_encode_src(const AceSynth * ctx,
                    const float *    src_audio,
                    int              src_len,
@@ -199,7 +224,7 @@ int ops_resolve_params(const AceSynth * ctx, const AceRequest * reqs, int batch_
     s.max_codes_len = 0;
     s.have_codes    = false;
     for (int b = 0; b < batch_n; b++) {
-        s.per_codes[b] = parse_csv<int>(reqs[b].audio_codes);
+        s.per_codes[b] = parse_csv_int(reqs[b].audio_codes);
         int sz         = (int) s.per_codes[b].size();
         if (sz > s.max_codes_len) {
             s.max_codes_len = sz;
@@ -222,7 +247,7 @@ void ops_build_schedule(SynthState & s) {
     // endpoint handled implicitly by the sampler, so we drop it and take
     // schedule = first N-1 entries, num_steps = N-1.
     if (!s.rr.custom_timesteps.empty()) {
-        std::vector<float> ts = parse_csv<float>(s.rr.custom_timesteps);
+        std::vector<float> ts = parse_csv_float(s.rr.custom_timesteps);
         if (ts.size() >= 2) {
             s.num_steps = (int) ts.size() - 1;
             s.schedule.assign(ts.begin(), ts.end() - 1);

From 635417fac59baf30d451e38507d70a909f97fc0d Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Wed, 6 May 2026 19:08:46 +0000
Subject: [PATCH 3/3] Fix clang-format violations in pipeline-synth-ops.cpp,
 qwen3-enc.h, dit-graph.h

Agent-Logs-Url: https://github.com/audiohacking/acestep.cpp/sessions/b1a4e02e-b7cf-4128-ac70-fd9acd368334

Co-authored-by: lmangani <1423657+lmangani@users.noreply.github.com>
---
 src/dit-graph.h            | 16 ++++++++++++----
 src/pipeline-synth-ops.cpp |  4 ++--
 src/qwen3-enc.h            |  8 ++++++--
 3 files changed, 20 insertions(+), 8 deletions(-)

diff --git a/src/dit-graph.h b/src/dit-graph.h
index 9601411..840d200 100644
--- a/src/dit-graph.h
+++ b/src/dit-graph.h
@@ -216,8 +216,12 @@ static struct ggml_tensor * dit_ggml_build_self_attn(
     // K/V come in F32 from mul_mat (no KV cache here). Cast to F16 before FA,
     // mirroring llama.cpp build_attn_mha for graphs without a KV cache.
     if (m->use_flash_attn) {
-        if (k->type == GGML_TYPE_F32) k = ggml_cast(ctx, k, GGML_TYPE_F16);
-        if (v->type == GGML_TYPE_F32) v = ggml_cast(ctx, v, GGML_TYPE_F16);
+        if (k->type == GGML_TYPE_F32) {
+            k = ggml_cast(ctx, k, GGML_TYPE_F16);
+        }
+        if (v->type == GGML_TYPE_F32) {
+            v = ggml_cast(ctx, v, GGML_TYPE_F16);
+        }
     }
 
     struct ggml_tensor * attn = m->use_flash_attn ? ggml_flash_attn_ext(ctx, q, k, v, mask, scale, 0.0f, 0.0f) :
@@ -333,8 +337,12 @@ static struct ggml_tensor * dit_ggml_build_cross_attn(struct ggml_context * ctx,
     // K/V come in F32 from mul_mat (no KV cache here). Cast to F16 before FA,
     // mirroring llama.cpp build_attn_mha for graphs without a KV cache.
     if (m->use_flash_attn) {
-        if (k->type == GGML_TYPE_F32) k = ggml_cast(ctx, k, GGML_TYPE_F16);
-        if (v->type == GGML_TYPE_F32) v = ggml_cast(ctx, v, GGML_TYPE_F16);
+        if (k->type == GGML_TYPE_F32) {
+            k = ggml_cast(ctx, k, GGML_TYPE_F16);
+        }
+        if (v->type == GGML_TYPE_F32) {
+            v = ggml_cast(ctx, v, GGML_TYPE_F16);
+        }
     }
 
     struct ggml_tensor * attn = m->use_flash_attn ? ggml_flash_attn_ext(ctx, q, k, v, mask, scale, 0.0f, 0.0f) :
diff --git a/src/pipeline-synth-ops.cpp b/src/pipeline-synth-ops.cpp
index 10995d3..269f108 100644
--- a/src/pipeline-synth-ops.cpp
+++ b/src/pipeline-synth-ops.cpp
@@ -12,8 +12,8 @@
 #include "task-types.h"
 #include "vae-enc.h"
 
-#include <charconv>
 #include <cerrno>
+#include <charconv>
 #include <cstdio>
 #include <cstdlib>
 #include <cstring>
@@ -63,7 +63,7 @@ static std::vector<float> parse_csv_float(const std::string & s) {
         }
         char * end = nullptr;
         errno      = 0;
-        float  v   = std::strtof(first, &end);
+        float v    = std::strtof(first, &end);
         if (end == first || errno == ERANGE) {
             break;
         }
diff --git a/src/qwen3-enc.h b/src/qwen3-enc.h
index 9d99201..6fd2463 100644
--- a/src/qwen3-enc.h
+++ b/src/qwen3-enc.h
@@ -184,8 +184,12 @@ static struct ggml_tensor * qwen3_build_self_attn(struct ggml_context * ctx,
     // K/V come in F32 from mul_mat (encoder, no KV cache). Cast to F16 before FA,
     // mirroring llama.cpp build_attn_mha for graphs without a KV cache.
     if (use_flash_attn) {
-        if (k->type == GGML_TYPE_F32) k = ggml_cast(ctx, k, GGML_TYPE_F16);
-        if (v->type == GGML_TYPE_F32) v = ggml_cast(ctx, v, GGML_TYPE_F16);
+        if (k->type == GGML_TYPE_F32) {
+            k = ggml_cast(ctx, k, GGML_TYPE_F16);
+        }
+        if (v->type == GGML_TYPE_F32) {
+            v = ggml_cast(ctx, v, GGML_TYPE_F16);
+        }
     }
 
     struct ggml_tensor * attn = use_flash_attn ? ggml_flash_attn_ext(ctx, q, k, v, mask, scale, 0.0f, 0.0f) :