chaokunyang commented on code in PR #3216:
URL: https://github.com/apache/fory/pull/3216#discussion_r2730143855


##########
cpp/fory/python/pyfory.cc:
##########
@@ -58,4 +58,133 @@ int Fory_PyFloatSequenceWriteToBuffer(PyObject *collection, Buffer *buffer,
   }
   return 0;
 }
+
+// Write varint64 with ZigZag encoding inline
+// Returns number of bytes written
+static inline uint32_t WriteVarint64ZigZag(uint8_t *arr, int64_t value) {
+  // ZigZag encoding: (value << 1) ^ (value >> 63)
+  uint64_t v = (static_cast<uint64_t>(value) << 1) ^
+               (static_cast<uint64_t>(value >> 63));
+
+  if (v < 0x80) {
+    arr[0] = static_cast<uint8_t>(v);
+    return 1;
+  }
+  arr[0] = static_cast<uint8_t>((v & 0x7F) | 0x80);
+  if (v < 0x4000) {
+    arr[1] = static_cast<uint8_t>(v >> 7);
+    return 2;
+  }
+  arr[1] = static_cast<uint8_t>((v >> 7) | 0x80);
+  if (v < 0x200000) {
+    arr[2] = static_cast<uint8_t>(v >> 14);
+    return 3;
+  }
+  arr[2] = static_cast<uint8_t>((v >> 14) | 0x80);
+  if (v < 0x10000000) {
+    arr[3] = static_cast<uint8_t>(v >> 21);
+    return 4;
+  }
+  arr[3] = static_cast<uint8_t>((v >> 21) | 0x80);
+  if (v < 0x800000000ULL) {
+    arr[4] = static_cast<uint8_t>(v >> 28);
+    return 5;
+  }
+  arr[4] = static_cast<uint8_t>((v >> 28) | 0x80);
+  if (v < 0x40000000000ULL) {
+    arr[5] = static_cast<uint8_t>(v >> 35);
+    return 6;
+  }
+  arr[5] = static_cast<uint8_t>((v >> 35) | 0x80);
+  if (v < 0x2000000000000ULL) {
+    arr[6] = static_cast<uint8_t>(v >> 42);
+    return 7;
+  }
+  arr[6] = static_cast<uint8_t>((v >> 42) | 0x80);
+  if (v < 0x100000000000000ULL) {
+    arr[7] = static_cast<uint8_t>(v >> 49);
+    return 8;
+  }
+  arr[7] = static_cast<uint8_t>((v >> 49) | 0x80);
+  arr[8] = static_cast<uint8_t>(v >> 56);
+  return 9;
+}
+
+Py_ssize_t Fory_PyInt64SequenceWriteToBuffer(PyObject *collection,

Review Comment:
   `Fory_PyInt64SequenceWriteToBuffer` returns -1 and sets a Python error
   when an element is out of int64 range (or is not an int), but the Cython
   caller only checks `bytes_written >= 0` and doesn't propagate the
   exception. Because the extern declaration has no `except` clause, the
   error is silently ignored and the header is written without advancing
   `writer_index`, corrupting the stream for lists with large Python ints
   (e.g., > 2^63-1). Please check `bytes_written < 0` and raise or fall
   back to the slow path.



-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: [email protected]

For queries about this service, please contact Infrastructure at:
[email protected]


---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]

Reply via email to