Further clean of rope

Phylliida · Phylliida · commit 8d7f6793bcb4 · 2025-10-24T15:24:59.000-07:00
diff --git a/rope.hpp b/rope.hpp
@@ -44,7 +44,7 @@ namespace Rope {
     __STATIC_INLINE__ std::vector<std::vector<float>> rope(const std::vector<float>& pos,
                                                            int dim,
                                                            int theta,
-                                                           const std::vector<int>* wraps = nullptr) {
+                                                           const std::vector<int>* wrap_dims = nullptr) {
         assert(dim % 2 == 0);
         int half_dim = dim / 2;
 
@@ -63,16 +63,16 @@ namespace Rope {
                 float omega_val       = omega[j];
                 float original_angle  = position * omega_val;
                 float angle           = original_angle;
-                float wrap = 0;
-                if (wraps != nullptr && !wraps->empty()) {
-                    size_t wrap_size = wraps->size();
+                int wrap_dim = 0;
+                if (wrap_dims != nullptr && !wrap_dims->empty()) {
+                    size_t wrap_size = wrap_dims->size();
                     // mod batch size since we only store this for one item in the batch
                     size_t wrap_idx  = wrap_size > 0 ? (i % wrap_size) : 0;
-                    wrap             = (*wraps)[wrap_idx];
+                    wrap_dim             = (*wrap_dims)[wrap_idx];
                 }
-                if (wrap > 0) {
+                if (wrap_dim > 0) {
                     constexpr float TWO_PI = 6.28318530717958647692f;
-                    float wrap_f            = static_cast<float>(wrap);
+                    float wrap_f            = static_cast<float>(wrap_dim);
                     float cycles            = omega_val * wrap_f / TWO_PI;
                     // closest periodic harmonic, necessary to ensure things neatly tile
                     // without this round, things don't tile at the boundaries and you end up
@@ -144,7 +144,7 @@ namespace Rope {
                                                   int bs,
                                                   int theta,
                                                   const std::vector<int>& axes_dim,
-                                                  const std::vector<std::vector<int>>* axes_wraps = nullptr) {
+                                                  const std::vector<std::vector<int>>* wrap_dims = nullptr) {
         std::vector<std::vector<float>> trans_ids = transpose(ids);
         size_t pos_len                            = ids.size() / bs;
         int num_axes                              = axes_dim.size();
@@ -159,12 +159,12 @@ namespace Rope {
         std::vector<std::vector<float>> emb(bs * pos_len, std::vector<float>(emb_dim * 2 * 2, 0.0));
         int offset = 0;
         for (int i = 0; i < num_axes; ++i) {
-            const std::vector<int>* axis_wrap = nullptr;
-            if (axes_wraps != nullptr && i < (int)axes_wraps->size()) {
-                axis_wrap = &(*axes_wraps)[i];
+            const std::vector<int>* axis_wrap_dims = nullptr;
+            if (wrap_dims != nullptr && i < (int)wrap_dims->size()) {
+                axis_wrap_dims = &(*wrap_dims)[i];
             }
             std::vector<std::vector<float>> rope_emb =
-                rope(trans_ids[i], axes_dim[i], theta, axis_wrap);  // [bs*pos_len, axes_dim[i]/2 * 2 * 2]
+                rope(trans_ids[i], axes_dim[i], theta, axis_wrap_dims);  // [bs*pos_len, axes_dim[i]/2 * 2 * 2]
             for (int b = 0; b < bs; ++b) {
                 for (int j = 0; j < pos_len; ++j) {
                     for (int k = 0; k < rope_emb[0].size(); ++k) {
@@ -277,11 +277,10 @@ namespace Rope {
                                                            const std::vector<ggml_tensor*>& ref_latents,
                                                            bool increase_ref_index,
                                                            int theta,
-                                                           const std::vector<int>& axes_dim,
-                                                           bool circular = false) {
-        circular = true;
+                                                           const std::vector<int>& axes_dim) {
         std::vector<std::vector<float>> ids = gen_qwen_image_ids(h, w, patch_size, bs, context_len, ref_latents, increase_ref_index);
-        std::vector<std::vector<int>> axes_wraps;
+        std::vector<std::vector<int>> wrap_dims;
+        // This logic simply stores the (pad and patch_adjusted) sizes of images so we can make sure rope correctly tiles
         if (sd_is_circular_padding_enabled() && bs > 0 && axes_dim.size() >= 3) {
             int pad_h = (patch_size - (h % patch_size)) % patch_size;
             int pad_w = (patch_size - (w % patch_size)) % patch_size;
@@ -290,14 +289,15 @@ namespace Rope {
             if (h_len > 0 && w_len > 0) {
                 const size_t total_tokens     = ids.size();
                 // Track per-token wrap lengths for the row/column axes so only spatial tokens become periodic.
-                axes_wraps.assign(axes_dim.size(), std::vector<int>(total_tokens / bs, 0));
+                wrap_dims.assign(axes_dim.size(), std::vector<int>(total_tokens / bs, 0));
                 size_t cursor = context_len; // ignore text tokens
                 const size_t img_tokens       = static_cast<size_t>(h_len) * static_cast<size_t>(w_len);
                 for (size_t token_i = 0; token_i < img_tokens; ++token_i) {
-                    axes_wraps[1][cursor + token_i] = h_len;
-                    axes_wraps[2][cursor + token_i] = w_len;
+                    wrap_dims[1][cursor + token_i] = h_len;
+                    wrap_dims[2][cursor + token_i] = w_len;
                 }
                 cursor += img_tokens;
+                // For each reference image, store wrap sizes as well
                 for (ggml_tensor* ref : ref_latents) {
                     if (ref == nullptr) {
                         continue;
@@ -310,14 +310,14 @@ namespace Rope {
                     int ref_w_len  = (ref_w + ref_pad_w) / patch_size;
                     size_t ref_n_tokens  = static_cast<size_t>(ref_h_len) * static_cast<size_t>(ref_w_len);
                     for (size_t token_i = 0; token_i < ref_n_tokens; ++token_i) {
-                        axes_wraps[1][cursor + token_i] = ref_h_len;
-                        axes_wraps[2][cursor + token_i] = ref_w_len;
+                        wrap_dims[1][cursor + token_i] = ref_h_len;
+                        wrap_dims[2][cursor + token_i] = ref_w_len;
                     }
                     cursor += ref_n_tokens;
                 }
             }
         }
-        const std::vector<std::vector<int>>* wraps_ptr = axes_wraps.empty() ? nullptr : &axes_wraps;
+        const std::vector<std::vector<int>>* wraps_ptr = wrap_dims.empty() ? nullptr : &wrap_dims;
         return embed_nd(ids, bs, theta, axes_dim, wraps_ptr);
     }