aboutsummaryrefslogtreecommitdiffstats
path: root/subprojects/store
diff options
context:
space:
mode:
authorLibravatar OszkarSemerath <semerath@mit.bme.hu>2023-07-21 21:14:18 +0200
committerLibravatar OszkarSemerath <semerath@mit.bme.hu>2023-07-21 21:14:18 +0200
commit04860420ded195f9434477dab33309da61edc7e9 (patch)
treee7a9b5963eac3cdae84375f28f81a359c41d0b97 /subprojects/store
parentVersionedMapStoreFactoryBuilder.java is introduced, all tests are updated. (diff)
downloadrefinery-04860420ded195f9434477dab33309da61edc7e9.tar.gz
refinery-04860420ded195f9434477dab33309da61edc7e9.tar.zst
refinery-04860420ded195f9434477dab33309da61edc7e9.zip
Improved tuple hash calculation
- by special handling of unary and binary relations
- by introducing murmur32Scramble
Diffstat (limited to 'subprojects/store')
-rw-r--r-- subprojects/store/src/main/java/tools/refinery/store/model/TupleHashProvider.java 125
1 file changed, 91 insertions, 34 deletions
diff --git a/subprojects/store/src/main/java/tools/refinery/store/model/TupleHashProvider.java b/subprojects/store/src/main/java/tools/refinery/store/model/TupleHashProvider.java
index 4bcf9ff4..1183b8f2 100644
--- a/subprojects/store/src/main/java/tools/refinery/store/model/TupleHashProvider.java
+++ b/subprojects/store/src/main/java/tools/refinery/store/model/TupleHashProvider.java
@@ -2,39 +2,43 @@ package tools.refinery.store.model;
2 2
3import tools.refinery.store.map.ContinousHashProvider; 3import tools.refinery.store.map.ContinousHashProvider;
4import tools.refinery.store.tuple.Tuple; 4import tools.refinery.store.tuple.Tuple;
5import tools.refinery.store.tuple.Tuple1;
6import tools.refinery.store.tuple.Tuple2;
5 7
6public class TupleHashProvider implements ContinousHashProvider<Tuple> { 8public class TupleHashProvider implements ContinousHashProvider<Tuple> {
7 protected static final int[] primes = new int[] { 31, 37, 41, 43, 47, 53, 59, 61, 67, 71, 73, 79, 83, 89, 97, 101, 9 protected static final int[] primes = new int[] { 2, 3, 5, 7, 11, 13, 17, 19, 23, 29, 31, 37, 41, 43, 47, 53, 59,
8 103, 107, 109, 113, 127, 131, 137, 139, 149, 151, 157, 163, 167, 173, 179, 181, 191, 193, 197, 199, 211, 10 61, 67, 71, 73, 79, 83, 89, 97, 101, 103, 107, 109, 113, 127, 131, 137, 139, 149, 151, 157, 163, 167, 173,
9 223, 227, 229, 233, 239, 241, 251, 257, 263, 269, 271, 277, 281, 283, 293, 307, 311, 313, 317, 331, 337, 11 179, 181, 191, 193, 197, 199, 211, 223, 227, 229, 233, 239, 241, 251, 257, 263, 269, 271, 277, 281, 283,
10 347, 349, 353, 359, 367, 373, 379, 383, 389, 397, 401, 409, 419, 421, 431, 433, 439, 443, 449, 457, 461, 12 293, 307, 311, 313, 317, 331, 337, 347, 349, 353, 359, 367, 373, 379, 383, 389, 397, 401, 409, 419, 421,
11 463, 467, 479, 487, 491, 499, 503, 509, 521, 523, 541, 547, 557, 563, 569, 571, 577, 587, 593, 599, 601, 13 431, 433, 439, 443, 449, 457, 461, 463, 467, 479, 487, 491, 499, 503, 509, 521, 523, 541, 547, 557, 563,
12 607, 613, 617, 619, 631, 641, 643, 647, 653, 659, 661, 673, 677, 683, 691, 701, 709, 719, 727, 733, 739, 14 569, 571, 577, 587, 593, 599, 601, 607, 613, 617, 619, 631, 641, 643, 647, 653, 659, 661, 673, 677, 683,
13 743, 751, 757, 761, 769, 773, 787, 797, 809, 811, 821, 823, 827, 829, 839, 853, 857, 859, 863, 877, 881, 15 691, 701, 709, 719, 727, 733, 739, 743, 751, 757, 761, 769, 773, 787, 797, 809, 811, 821, 823, 827, 829,
14 883, 887, 907, 911, 919, 929, 937, 941, 947, 953, 967, 971, 977, 983, 991, 997, 1009, 1013, 1019, 1021, 16 839, 853, 857, 859, 863, 877, 881, 883, 887, 907, 911, 919, 929, 937, 941, 947, 953, 967, 971, 977, 983,
15 1031, 1033, 1039, 1049, 1051, 1061, 1063, 1069, 1087, 1091, 1093, 1097, 1103, 1109, 1117, 1123, 1129, 1151, 17 991, 997, 1009, 1013, 1019, 1021, 1031, 1033, 1039, 1049, 1051, 1061, 1063, 1069, 1087, 1091, 1093, 1097,
16 1153, 1163, 1171, 1181, 1187, 1193, 1201, 1213, 1217, 1223, 1229, 1231, 1237, 1249, 1259, 1277, 1279, 1283, 18 1103, 1109, 1117, 1123, 1129, 1151, 1153, 1163, 1171, 1181, 1187, 1193, 1201, 1213, 1217, 1223, 1229, 1231,
17 1289, 1291, 1297, 1301, 1303, 1307, 1319, 1321, 1327, 1361, 1367, 1373, 1381, 1399, 1409, 1423, 1427, 1429, 19 1237, 1249, 1259, 1277, 1279, 1283, 1289, 1291, 1297, 1301, 1303, 1307, 1319, 1321, 1327, 1361, 1367, 1373,
18 1433, 1439, 1447, 1451, 1453, 1459, 1471, 1481, 1483, 1487, 1489, 1493, 1499, 1511, 1523, 1531, 1543, 1549, 20 1381, 1399, 1409, 1423, 1427, 1429, 1433, 1439, 1447, 1451, 1453, 1459, 1471, 1481, 1483, 1487, 1489, 1493,
19 1553, 1559, 1567, 1571, 1579, 1583, 1597, 1601, 1607, 1609, 1613, 1619, 1621, 1627, 1637, 1657, 1663, 1667, 21 1499, 1511, 1523, 1531, 1543, 1549, 1553, 1559, 1567, 1571, 1579, 1583, 1597, 1601, 1607, 1609, 1613, 1619,
20 1669, 1693, 1697, 1699, 1709, 1721, 1723, 1733, 1741, 1747, 1753, 1759, 1777, 1783, 1787, 1789, 1801, 1811, 22 1621, 1627, 1637, 1657, 1663, 1667, 1669, 1693, 1697, 1699, 1709, 1721, 1723, 1733, 1741, 1747, 1753, 1759,
21 1823, 1831, 1847, 1861, 1867, 1871, 1873, 1877, 1879, 1889, 1901, 1907, 1913, 1931, 1933, 1949, 1951, 1973, 23 1777, 1783, 1787, 1789, 1801, 1811, 1823, 1831, 1847, 1861, 1867, 1871, 1873, 1877, 1879, 1889, 1901, 1907,
22 1979, 1987, 1993, 1997, 1999, 2003, 2011, 2017, 2027, 2029, 2039, 2053, 2063, 2069, 2081, 2083, 2087, 2089, 24 1913, 1931, 1933, 1949, 1951, 1973, 1979, 1987, 1993, 1997, 1999, 2003, 2011, 2017, 2027, 2029, 2039, 2053,
23 2099, 2111, 2113, 2129, 2131, 2137, 2141, 2143, 2153, 2161, 2179, 2203, 2207, 2213, 2221, 2237, 2239, 2243, 25 2063, 2069, 2081, 2083, 2087, 2089, 2099, 2111, 2113, 2129, 2131, 2137, 2141, 2143, 2153, 2161, 2179, 2203,
24 2251, 2267, 2269, 2273, 2281, 2287, 2293, 2297, 2309, 2311, 2333, 2339, 2341, 2347, 2351, 2357, 2371, 2377, 26 2207, 2213, 2221, 2237, 2239, 2243, 2251, 2267, 2269, 2273, 2281, 2287, 2293, 2297, 2309, 2311, 2333, 2339,
25 2381, 2383, 2389, 2393, 2399, 2411, 2417, 2423, 2437, 2441, 2447, 2459, 2467, 2473, 2477, 2503, 2521, 2531, 27 2341, 2347, 2351, 2357, 2371, 2377, 2381, 2383, 2389, 2393, 2399, 2411, 2417, 2423, 2437, 2441, 2447, 2459,
26 2539, 2543, 2549, 2551, 2557, 2579, 2591, 2593, 2609, 2617, 2621, 2633, 2647, 2657, 2659, 2663, 2671, 2677, 28 2467, 2473, 2477, 2503, 2521, 2531, 2539, 2543, 2549, 2551, 2557, 2579, 2591, 2593, 2609, 2617, 2621, 2633,
27 2683, 2687, 2689, 2693, 2699, 2707, 2711, 2713, 2719, 2729, 2731, 2741, 2749, 2753, 2767, 2777, 2789, 2791, 29 2647, 2657, 2659, 2663, 2671, 2677, 2683, 2687, 2689, 2693, 2699, 2707, 2711, 2713, 2719, 2729, 2731, 2741,
28 2797, 2801, 2803, 2819, 3089, 3109, 3119, 3121, 3137, 3163, 3167, 3169, 3181, 3187, 3191, 3203, 3209, 3217, 30 2749, 2753, 2767, 2777, 2789, 2791, 2797, 2801, 2803, 2819, 3089, 3109, 3119, 3121, 3137, 3163, 3167, 3169,
29 3221, 3229, 3251, 3253, 3257, 3259, 3271, 3299, 3301, 3307, 3313, 3319, 3323, 3329, 3331, 3343, 3347, 3359, 31 3181, 3187, 3191, 3203, 3209, 3217, 3221, 3229, 3251, 3253, 3257, 3259, 3271, 3299, 3301, 3307, 3313, 3319,
30 3361, 3371, 3373, 3389, 3391, 3407, 3413, 3433, 3449, 3457, 3461, 3463, 3467, 3469, 3491, 3499, 3511, 3517, 32 3323, 3329, 3331, 3343, 3347, 3359, 3361, 3371, 3373, 3389, 3391, 3407, 3413, 3433, 3449, 3457, 3461, 3463,
31 3527, 3529, 3533, 3539, 3541, 3547, 3557, 3559, 3571, 3581, 3583, 3593, 3607, 3613, 3617, 3623, 3631, 3637, 33 3467, 3469, 3491, 3499, 3511, 3517, 3527, 3529, 3533, 3539, 3541, 3547, 3557, 3559, 3571, 3581, 3583, 3593,
32 3643, 3659, 3671, 3673, 3677, 3691, 3697, 3701, 3709, 3719, 3727, 3733, 3739, 3761, 3767, 3769, 3779, 3793, 34 3607, 3613, 3617, 3623, 3631, 3637, 3643, 3659, 3671, 3673, 3677, 3691, 3697, 3701, 3709, 3719, 3727, 3733,
33 3797, 3803, 3821, 3823, 3833, 3847, 3851, 3853, 3863, 3877, 3881, 3889, 3907, 3911 }; 35 3739, 3761, 3767, 3769, 3779, 3793, 3797, 3803, 3821, 3823, 3833, 3847, 3851, 3853, 3863, 3877, 3881, 3889,
34 36 3907, 3911 };
35 public static final long LARGEST_PRIME_30_BITS = 1073741789; 37
36 38 protected static final long LARGEST_PRIME_30_BITS_LONG = 1073741789;
37 public static final int MAX_MODEL_SIZE = (int) LARGEST_PRIME_30_BITS; 39 protected static final int LARGEST_PRIME_30_BITS_INTEGER = 1073741789;
40 protected static final int LARGEST_BINARY_INDEX_1 = LARGEST_PRIME_30_BITS_INTEGER / 4;
41 public static final int MAX_MODEL_SIZE = LARGEST_PRIME_30_BITS_INTEGER;
38 42
39 public static final TupleHashProvider INSTANCE = new TupleHashProvider(); 43 public static final TupleHashProvider INSTANCE = new TupleHashProvider();
40 44
@@ -47,15 +51,68 @@ public class TupleHashProvider implements ContinousHashProvider<Tuple> {
47 51
48 @Override 52 @Override
49 public int getHash(Tuple key, int index) { 53 public int getHash(Tuple key, int index) {
50 if (index >= primes.length) { 54 if(key instanceof Tuple1 t1) {
51 throw new IllegalArgumentException("Not enough prime numbers to support index"); 55 return t1.value0();
56 } else if(key instanceof Tuple2 t2){
57 if(index == 0) {
58 return murmur3T2(t2.value0(), t2.value1());
59 } else if(index == 1) {
60 return lagrangeT2I0Quick(t2);
61 } else if(index == 2) {
62 return lagrangeT2I1Quick(t2);
63 } else {
64 return lagrangeTXIX(key, index-1);
65 }
66 } else {
67 return lagrangeTXIX(key, index);
52 } 68 }
69
70 }
71
72 private static int lagrangeT2I0Quick(Tuple2 t2) {
73 int result = 2 * t2.value0() + t2.value1();
74 if (result > LARGEST_PRIME_30_BITS_INTEGER) {
75 return result % LARGEST_PRIME_30_BITS_INTEGER;
76 } else
77 return result;
78 }
79 private static int lagrangeT2I1Quick(Tuple2 t2) {
80 int value0 = t2.value0();
81 int value1 = t2.value1();
82 if(value0 < LARGEST_BINARY_INDEX_1 && value1 < LARGEST_BINARY_INDEX_1) {
83 return 3* value0 + value1;
84 } else {
85 return lagrangeTXIX(t2, 1);
86 }
87 }
88
89 private static int lagrangeTXIX(Tuple key, int index) {
53 long accumulator = 0; 90 long accumulator = 0;
54 final int prime = primes[index]; 91 final int prime = primes[index];
55 for (int i = 0; i < key.getSize(); i++) { 92 for (int i = 0; i < key.getSize(); i++) {
56 accumulator = (prime * accumulator + key.get(i)) % MAX_MODEL_SIZE; 93 accumulator = (prime * accumulator + key.get(i)) % LARGEST_PRIME_30_BITS_LONG;
57 } 94 }
58 95
59 return (int) accumulator; 96 return (int) accumulator;
60 } 97 }
98
99 private static int murmur3T2(int v0, int v1)
100 {
101 int h = 0;
102
103 h = murmur32Scramble(v0, h);
104 h = murmur32Scramble(v1, h);
105
106 return h;
107 }
108
109 private static int murmur32Scramble(int k, int h) {
110 k *= 0xcc9e2d51;
111 k = (k << 15) | (k >>> 17);
112 k *= 0x1b873593;
113 h ^= k;
114 h = (h << 13) | (h >>> 19);
115 h = h * 5 + 0xe6546b64;
116 return h;
117 }
61} 118}