Monday, July 23, 2007

Collections deepEquals()

There was some discussion on Eamonn McManus's blog (java.net) about Arrays.deepEquals() and a collections version. http://weblogs.java.net/blog/emcmanus/archive/2007/07/comparing_objec.html

I've decided to construct a first attempt at this. The idea is that two lists are deepEqual if the elements in them are equal. Of course the elements in a list can be other lists and so on. This applies to Sets and Maps also. This code attempts to be generic enough to compare two collections of the same type for deep equality. This is only a first attempt I'm sure there can be some enhancements/optimizations made.


NOTE: It does not (yet) handle collections that include themselves.


import java.util.ArrayList;
import java.util.Collection;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.TreeSet;


public class DeepEqualsTest {

/**
* @param args
*/
public static void main(String args[]) {

ArrayList<Object> stuff1 = new ArrayList<Object>();
stuff1.add(null);
stuff1.add("A");
stuff1.add(new Object[] { "B", "C", null });

ArrayList<Object> stuff2 = new ArrayList<Object>();
stuff2.add(null);
stuff2.add("A");
stuff2.add(new Object[] { "B", "C", null });

TreeSet<Integer> ts1 = new TreeSet<Integer>();
ts1.add(1);
ts1.add(3);
ts1.add(2);

TreeSet<Integer> ts2 = new TreeSet<Integer>();
ts2.add(1);
ts2.add(2);
ts2.add(3);
// ts2.add(4);

HashMap<String, Object> map1 = new HashMap<String, Object>();
HashMap<String, Object> map2 = new HashMap<String, Object>();

map1.put("key1", new Object[] { ts1, "hi", 123, 456 });
map2.put("key1", new Object[] { ts2, "hi", 123, 456 });

stuff1.add(map1);
stuff2.add(map2);

System.out.println("Result = " + deepEquals(stuff1, stuff2));
}

/**
* An implementation of "deep equals" for collection classes, built in the
* Arrays.deepEquals() style. It attempts to compare equality based on the
* contents of the collection.
*
* @param t1 -
* first object, most likely a collection of some sort.
* @param t2 -
* second object, most likely a collection of some sort.
* @return - true if the content of the collections are equal.
*/
public static <T> boolean deepEquals(T t1, T t2) {

if (t1 == t2) {
return true;
}

if (t1 == null || t2 == null) {
return false;
}

if (t1 instanceof Map && t2 instanceof Map) {
return mapDeepEquals((Map<?, ?>) t1, (Map<?, ?>) t2);
} else if (t1 instanceof List && t2 instanceof List) {
return linearDeepEquals((List<?>) t1, (List<?>) t2);

} else if (t1 instanceof Set && t2 instanceof Set) {
return linearDeepEquals((Set<?>) t1, (Set<?>) t2);

} else if (t1 instanceof Object[] && t2 instanceof Object[]) {
return linearDeepEquals((Object[]) t1, (Object[]) t2);

} else {
return t1.equals(t2);
}
}

/**
* Compares two maps for equality. This is based around the idea that if the
* keys are deep equal and the values the keys return are deep equal then
* the maps are equal.
*
* @param m1 -
* first map
* @param m2 -
* second map
* @return - weather the maps are deep equal
*/
private static boolean mapDeepEquals(Map<?, ?> m1, Map<?, ?> m2) {
if (m1.size() != m1.size()) {
return false;
}

Set<?> allKeys = m1.keySet();
if (!linearDeepEquals(allKeys, m2.keySet())) {
return false;
}

for (Object key : allKeys) {
if (!deepEquals(m1.get(key), m2.get(key))) {
return false;
}
}
return true;
}

/**
* Compares two Collections for deep equality.
*
* @param s1
* @param s2
* @return
*/
private static boolean linearDeepEquals(Collection<?> s1, Collection<?> s2) {
if (s1.size() != s2.size()) {
return false;
}

for (Object s1Item : s1) {
boolean found = false;
for (Object s2Item : s2) {
if (deepEquals(s2Item, s1Item)) {
found = true;
break;
}
}
if (!found) {
return false;
}
}
return true;
}

/**
* Compares two Object[] for deep equality
*
* @param s1
* @param s2
* @return
*/
private static boolean linearDeepEquals(Object[] s1, Object[] s2) {

if (s1.length != s2.length) {
return false;
}

for (Object s1Item : s1) {
boolean found = false;
for (Object s2Item : s2) {
if (deepEquals(s2Item, s1Item)) {
found = true;
break;
}
}
if (!found) {
return false;
}
}
return true;
}
}

2 comments:

AlexFace said...

Hi,

seems like your code will compare all Collections as Sets (without checking the order), meanwhile two Lists are not equal if they contain the same elements but in a different order.

Unknown said...

Very good point. But there are some sets that are order dependent, like SortedSet. I will adjust and repost at some point. There is probably a much better design for this type of functionality, like a getDeepEqulator() method that would return an object capable of dealing with these issues.