zeroshade commented on code in PR #35823:
URL: https://github.com/apache/arrow/pull/35823#discussion_r1210566705


##########
go/arrow/array/compare.go:
##########
@@ -732,3 +732,57 @@ func arrayApproxEqualStruct(left, right *Struct, opt 
equalOption) bool {
        }
        return true
 }
+
+// arrayApproxEqualMap doesn't care about the order of keys (in Go map 
traversal order is undefined)
+func arrayApproxEqualMap(left, right *Map, opt equalOption) bool {
+       for i := 0; i < left.Len(); i++ {
+               if left.IsNull(i) {
+                       continue
+               }
+               if 
!arrayApproxEqualSingleMapEntry(left.newListValue(i).(*Struct), 
right.newListValue(i).(*Struct), opt) {
+                       return false
+               }
+       }
+       return true
+}
+
+// arrayApproxEqualSingleMapEntry is a helper function that checks if a single 
entry pair is approx equal.
+// Basically, it doesn't care about key order.
+// structs passed will be released
+func arrayApproxEqualSingleMapEntry(left, right *Struct, opt equalOption) bool 
{
+       defer left.Release()
+       defer right.Release()
+
+       // Every element here is a key-value pair
+       lElems := make([]arrow.Array, left.Len())
+       rElems := make([]arrow.Array, right.Len())
+       for i := 0; i < left.Len(); i++ {
+               lElems[i] = NewSlice(left, int64(i), int64(i+1))
+               rElems[i] = NewSlice(right, int64(i), int64(i+1))
+       }
+       defer func() {
+               for i := range lElems {
+                       lElems[i].Release()
+                       rElems[i].Release()
+               }
+       }()
+
+       used := make(map[int]bool, right.Len())
+       for _, ll := range lElems {
+               found := false
+               for i, rr := range rElems {
+                       if used[i] {
+                               continue
+                       }
+                       if arrayApproxEqual(ll, rr, opt) {
+                               found = true
+                               used[i] = true
+                               break
+                       }
+               }

Review Comment:
   rather than calling `arrayApproxEqual` on the whole struct, we should 
probably be just comparing the first field (the key field) of each and then 
*only* comparing the second field (the value field) if the first field matched.



##########
go/arrow/array/compare.go:
##########
@@ -732,3 +732,57 @@ func arrayApproxEqualStruct(left, right *Struct, opt 
equalOption) bool {
        }
        return true
 }
+
+// arrayApproxEqualMap doesn't care about the order of keys (in Go map 
traversal order is undefined)
+func arrayApproxEqualMap(left, right *Map, opt equalOption) bool {
+       for i := 0; i < left.Len(); i++ {
+               if left.IsNull(i) {
+                       continue
+               }
+               if 
!arrayApproxEqualSingleMapEntry(left.newListValue(i).(*Struct), 
right.newListValue(i).(*Struct), opt) {
+                       return false
+               }
+       }
+       return true
+}
+
+// arrayApproxEqualSingleMapEntry is a helper function that checks if a single 
entry pair is approx equal.
+// Basically, it doesn't care about key order.
+// structs passed will be released
+func arrayApproxEqualSingleMapEntry(left, right *Struct, opt equalOption) bool 
{
+       defer left.Release()
+       defer right.Release()
+
+       // Every element here is a key-value pair
+       lElems := make([]arrow.Array, left.Len())
+       rElems := make([]arrow.Array, right.Len())
+       for i := 0; i < left.Len(); i++ {
+               lElems[i] = NewSlice(left, int64(i), int64(i+1))
+               rElems[i] = NewSlice(right, int64(i), int64(i+1))
+       }
+       defer func() {
+               for i := range lElems {
+                       lElems[i].Release()
+                       rElems[i].Release()
+               }
+       }()

Review Comment:
   why are these slices necessary? can't you just use the indices of the arrays 
themselves? 
   
   you could also just use `sliceApproxEqual` rather than creating a bunch of 
slices up front



##########
go/arrow/array/compare.go:
##########
@@ -732,3 +732,57 @@ func arrayApproxEqualStruct(left, right *Struct, opt 
equalOption) bool {
        }
        return true
 }
+
+// arrayApproxEqualMap doesn't care about the order of keys (in Go map 
traversal order is undefined)
+func arrayApproxEqualMap(left, right *Map, opt equalOption) bool {
+       for i := 0; i < left.Len(); i++ {
+               if left.IsNull(i) {
+                       continue
+               }
+               if 
!arrayApproxEqualSingleMapEntry(left.newListValue(i).(*Struct), 
right.newListValue(i).(*Struct), opt) {
+                       return false
+               }
+       }
+       return true
+}
+
+// arrayApproxEqualSingleMapEntry is a helper function that checks if a single 
entry pair is approx equal.
+// Basically, it doesn't care about key order.
+// structs passed will be released
+func arrayApproxEqualSingleMapEntry(left, right *Struct, opt equalOption) bool 
{
+       defer left.Release()
+       defer right.Release()
+
+       // Every element here is a key-value pair
+       lElems := make([]arrow.Array, left.Len())
+       rElems := make([]arrow.Array, right.Len())
+       for i := 0; i < left.Len(); i++ {
+               lElems[i] = NewSlice(left, int64(i), int64(i+1))
+               rElems[i] = NewSlice(right, int64(i), int64(i+1))
+       }
+       defer func() {
+               for i := range lElems {
+                       lElems[i].Release()
+                       rElems[i].Release()
+               }
+       }()
+
+       used := make(map[int]bool, right.Len())
+       for _, ll := range lElems {
+               found := false
+               for i, rr := range rElems {
+                       if used[i] {
+                               continue
+                       }
+                       if arrayApproxEqual(ll, rr, opt) {
+                               found = true
+                               used[i] = true
+                               break
+                       }
+               }
+               if !found {
+                       return false
+               }
+       }
+       return true

Review Comment:
   should verify that `len(used)` == `right.Len()`. Otherwise this would return 
true in the case where the right side contains keys the left side was missing. 
   
   Should also add test cases for failed comparisons where keys have different 
values and when keys are missing between the operands.



-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: [email protected]

For queries about this service, please contact Infrastructure at:
[email protected]

Reply via email to