File: OpenLongObjectHashMap.java

package info (click to toggle)
libcolt-free-java 1.2.0%2Bdfsg-7
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, bullseye, buster
  • size: 20,816 kB
  • sloc: java: 30,344; xml: 896; makefile: 24; sh: 3
file content (498 lines) | stat: -rw-r--r-- 18,789 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
/*
Copyright (c) 1999 CERN - European Organization for Nuclear Research.
Permission to use, copy, modify, distribute and sell this software and its documentation for any purpose 
is hereby granted without fee, provided that the above copyright notice appear in all copies and 
that both that copyright notice and this permission notice appear in supporting documentation. 
CERN makes no representations about the suitability of this software for any purpose. 
It is provided "as is" without expressed or implied warranty.
*/
package cern.colt.map;

import cern.colt.function.LongObjectProcedure;
import cern.colt.function.LongProcedure;
import cern.colt.list.ByteArrayList;
import cern.colt.list.LongArrayList;
import cern.colt.list.ObjectArrayList;
/**
Hash map holding (key,value) associations of type <tt>(long-->Object)</tt>; automatically grows and shrinks as needed; implemented using open addressing with double hashing.
First see the <a href="package-summary.html">package summary</a> and javadoc <a href="package-tree.html">tree view</a> to get the broad picture.

Overrides many methods for performance reasons only.

@author wolfgang.hoschek@cern.ch
@version 1.0, 09/24/99
@see	    java.util.HashMap
*/
public class OpenLongObjectHashMap extends AbstractLongObjectMap {
	 /**
	 * The hash table keys.
	 * Slot <tt>i</tt> holds a live key only while <tt>state[i]==FULL</tt>;
	 * the lookup methods of this class never compare keys of FREE or REMOVED slots.
	 * @serial
	 */
	protected long table[];

	 /**
	 * The hash table values; <tt>values[i]</tt> belongs to the key in <tt>table[i]</tt>.
	 * @serial
	 */
	protected Object values[];

	/**
	 * The state of each hash table entry (FREE, FULL, REMOVED); <tt>state[i]</tt> describes slot <tt>i</tt> of <tt>table</tt> and <tt>values</tt>.
	 * @serial
	 */
	protected byte state[];

	/**
	 * The number of table entries in state==FREE.
	 * @serial
	 */
	protected int freeEntries;
	
	
	/**
	 * Slot state: the slot holds no association and ends a probe sequence.
	 * Being 0, it is also the state of every slot in a newly allocated <tt>byte[]</tt>.
	 */
	protected static final byte FREE = 0;
	/** Slot state: the slot holds a live (key,value) association. */
	protected static final byte FULL = 1;
	/**
	 * Slot state: the slot held an association that was removed.
	 * Lookups probe past such slots; insertions may reuse them.
	 */
	protected static final byte REMOVED = 2;

/**
 * Constructs an empty map with default capacity and default load factors.
 * Delegates to {@link #OpenLongObjectHashMap(int)}, passing <tt>defaultCapacity</tt>.
 */
public OpenLongObjectHashMap() {
	this(defaultCapacity);
}
/**
 * Constructs an empty map with the specified initial capacity and default load factors.
 * Delegates to {@link #OpenLongObjectHashMap(int, double, double)}, passing
 * <tt>defaultMinLoadFactor</tt> and <tt>defaultMaxLoadFactor</tt>.
 *
 * @param      initialCapacity   the initial capacity of the map.
 * @throws     IllegalArgumentException if the initial capacity is less
 *             than zero.
 */
public OpenLongObjectHashMap(int initialCapacity) {
	this(initialCapacity, defaultMinLoadFactor, defaultMaxLoadFactor);
}
/**
 * Constructs an empty map with
 * the specified initial capacity and the specified minimum and maximum load factor.
 * All initialization is performed by {@link #setUp(int, double, double)}.
 *
 * @param      initialCapacity   the initial capacity.
 * @param      minLoadFactor        the minimum load factor.
 * @param      maxLoadFactor        the maximum load factor.
 * @throws	IllegalArgumentException if <tt>initialCapacity &lt; 0 || (minLoadFactor &lt; 0.0 || minLoadFactor &gt;= 1.0) || (maxLoadFactor &lt;= 0.0 || maxLoadFactor &gt;= 1.0) || (minLoadFactor &gt;= maxLoadFactor)</tt>.
 */
public OpenLongObjectHashMap(int initialCapacity, double minLoadFactor, double maxLoadFactor) {
	// NOTE(review): setUp is protected and overridable; an override in a subclass
	// runs here, before that subclass's own constructor body has executed.
	setUp(initialCapacity,minLoadFactor,maxLoadFactor);
}
/**
 * Removes all (key,value) associations from the receiver.
 * Implicitly calls <tt>trimToSize()</tt>.
 * <p>
 * Every slot is marked FREE and every value reference is dropped.
 * The key array is not touched; the lookup methods of this class never compare keys of FREE slots.
 */
public void clear() {
	// Fill the arrays directly instead of allocating temporary list wrappers around them.
	// java.util.Arrays is fully qualified on purpose: no import is needed and the
	// name cannot be confused with cern.colt.Arrays.
	java.util.Arrays.fill(this.state, FREE);
	java.util.Arrays.fill(this.values, null); // release the references to the old values

	this.distinct = 0;
	this.freeEntries = table.length; // every slot is FREE again
	trimToSize();
}
/**
 * Returns a copy of the receiver that has its own key, value and state arrays.
 * The three arrays are cloned; the value objects referenced from the value array
 * are not cloned themselves (an array clone copies references only).
 *
 * @return  a copy of the receiver.
 */
public Object clone() {
	final OpenLongObjectHashMap duplicate = (OpenLongObjectHashMap) super.clone();
	// Re-point the copy at clones of the arrays it currently holds.
	duplicate.state = (byte[]) duplicate.state.clone();
	duplicate.values = (Object[]) duplicate.values.clone();
	duplicate.table = (long[]) duplicate.table.clone();
	return duplicate;
}
/**
 * Tells whether the receiver holds an association for the given key.
 *
 * @param key the key to look up.
 * @return <tt>true</tt> if the receiver contains the specified key.
 */
public boolean containsKey(long key) {
	final int slot = indexOfKey(key); // negative means "not found"
	return slot >= 0;
}
/**
 * Tells whether at least one key of the receiver is associated with the given value.
 * The search is delegated to <tt>indexOfValue(value)</tt>.
 *
 * @param value the value to look up.
 * @return <tt>true</tt> if the receiver contains the specified value.
 */
public boolean containsValue(Object value) {
	final int slot = indexOfValue(value); // negative means "not found"
	return slot >= 0;
}
/**
 * Ensures that the receiver can hold at least the specified number of associations without needing to allocate new internal memory.
 * If necessary, allocates new internal memory and increases the capacity of the receiver.
 * <p>
 * This method never need be called; it is for performance tuning only.
 * Calling this method before <tt>put()</tt>ing a large number of associations boosts performance,
 * because the receiver will grow only once instead of potentially many times and hash collisions get less probable.
 * <p>
 * Nothing happens when the table already has at least <tt>minCapacity</tt> slots;
 * otherwise the table is rehashed into <tt>nextPrime(minCapacity)</tt> slots.
 *
 * @param   minCapacity   the desired minimum capacity.
 */
public void ensureCapacity(int minCapacity) {
	if (minCapacity <= table.length) return; // already large enough
	rehash(nextPrime(minCapacity));
}
/**
 * Applies a procedure to each key of the receiver, if any.
 * Note: Iterates over the keys in no particular order.
 * Subclasses can define a particular order, for example, "sorted by key".
 * All methods which <i>can</i> be expressed in terms of this method (most methods can) <i>must guarantee</i> to use the <i>same</i> order defined by this method, even if it is no particular order.
 * This is necessary so that, for example, methods <tt>keys</tt> and <tt>values</tt> will yield association pairs, not two uncorrelated lists.
 * <p>
 * This implementation walks the table from the last slot down to slot 0 and visits FULL slots only.
 *
 * @param procedure    the procedure to be applied. Stops iteration if the procedure returns <tt>false</tt>, otherwise continues. 
 * @return <tt>false</tt> if the procedure stopped before all keys were iterated over, <tt>true</tt> otherwise. 
 */
public boolean forEachKey(LongProcedure procedure) {
	int slot = table.length;
	while (--slot >= 0) {
		if (state[slot] != FULL) continue; // FREE or REMOVED: nothing to report
		if (!procedure.apply(table[slot])) return false;
	}
	return true;
}
/**
 * Applies a procedure to each (key,value) pair of the receiver, if any.
 * Iteration order is guaranteed to be <i>identical</i> to the order used by method {@link #forEachKey(LongProcedure)}.
 * <p>
 * This implementation walks the table from the last slot down to slot 0 and visits FULL slots only.
 *
 * @param procedure    the procedure to be applied. Stops iteration if the procedure returns <tt>false</tt>, otherwise continues. 
 * @return <tt>false</tt> if the procedure stopped before all keys were iterated over, <tt>true</tt> otherwise. 
 */
public boolean forEachPair(final LongObjectProcedure procedure) {
	int slot = table.length;
	while (--slot >= 0) {
		if (state[slot] != FULL) continue; // FREE or REMOVED: nothing to report
		if (!procedure.apply(table[slot], values[slot])) return false;
	}
	return true;
}
/**
 * Returns the value associated with the specified key.
 * A <tt>null</tt> result is ambiguous: it is returned both when the key is absent and when the key is
 * associated with <tt>null</tt>; use {@link #containsKey(long)} to tell the two cases apart.
 *
 * @param key the key to be searched for.
 * @return the value associated with the specified key; <tt>null</tt> if no such key is present.
 */
public Object get(long key) {
	final int slot = indexOfKey(key);
	return (slot < 0) ? null : values[slot];
}
/**
 * Locates the slot at which the given key is stored, or at which it should be stored.
 * <p>
 * The probe sequence starts at <tt>hash % length</tt> and steps backwards by a second, key dependent
 * amount (double hashing), wrapping around at slot 0.
 * If the first slot that is not occupied by a different key is a REMOVED slot, probing continues to find out
 * whether the key is stored further along the sequence; if it is not, that first REMOVED slot is returned for reuse.
 *
 * @param key the key to be added to the receiver.
 * @return the index where the key would need to be inserted, if it is not already contained.
 * Returns -index-1 if the key is already contained at slot index.
 * Therefore, if the returned index &lt; 0, then it is already contained at slot -index-1.
 * If the returned index &gt;= 0, then it is NOT already contained and should be inserted at slot index.
 */
protected int indexOfInsertion(long key) {
	final long tab[] = table;
	final byte stat[] = state;
	final int length = tab.length;

	// clear the sign bit so that both remainders computed below are non-negative
	final int hash = HashFunctions.hash(key) & 0x7FFFFFFF;
	int i = hash % length;
	int decrement = hash % (length-2); // double hashing, see http://www.eece.unm.edu/faculty/heileman/hash/node4.html
	//int decrement = (hash / length) % length;
	if (decrement == 0) decrement = 1; // a step of 0 would probe the same slot forever

	// phase 1: walk past slots that are FULL with a different key.
	// stop if we find a removed or free slot, or if we find the key itself
	// do NOT skip over removed slots (yes, open addressing is like that...)
	while (stat[i] == FULL && tab[i] != key) {
		i -= decrement;
		//hashCollisions++;
		if (i<0) i+=length; // wrap around
	}
	
	if (stat[i] == REMOVED) {
		// phase 2: the key may still be stored beyond this removed slot.
		// stop if we find a free slot, or if we find the key itself.
		// do skip over removed slots (yes, open addressing is like that...)
		// assertion: there is at least one FREE slot.
		int j = i; // remember the first removed slot; it is reused if the key turns out to be absent
		while (stat[i] != FREE && (stat[i] == REMOVED || tab[i] != key)) {
			i -= decrement;
			//hashCollisions++;
			if (i<0) i+=length; // wrap around
		}
		if (stat[i] == FREE) i = j; // key absent: fall back to the remembered removed slot
	}
	
	
	if (stat[i] == FULL) {
		// key already contained at slot i.
		// return a negative number identifying the slot.
		return -i-1;
	}
	// not already contained, should be inserted at slot i.
	// return a number >= 0 identifying the slot.
	return i; 
}
/**
 * Searches the table for the given key, using the same start slot and step as <tt>indexOfInsertion</tt>.
 * The search ends at the first FREE slot (key absent) or at the first slot that is neither FREE nor REMOVED
 * and holds the key; REMOVED slots are stepped over.
 *
 * @param key the key to be searched in the receiver.
 * @return the index where the key is contained in the receiver, returns -1 if the key was not found.
 */
protected int indexOfKey(long key) {
	final long[] keys = table;
	final byte[] states = state;
	final int capacity = keys.length;

	// clear the sign bit so that both remainders computed below are non-negative
	final int hash = HashFunctions.hash(key) & 0x7FFFFFFF;
	int slot = hash % capacity;
	int step = hash % (capacity - 2); // second hash: the probe step (double hashing)
	if (step == 0) step = 1; // a step of 0 would probe the same slot forever

	for (;;) {
		final byte current = states[slot];
		if (current == FREE) return -1; // end of the probe sequence: not found
		if (current != REMOVED && keys[slot] == key) return slot; // found
		slot -= step;
		if (slot < 0) slot += capacity; // wrap around
	}
}
/**
 * Scans the table from the last slot down to slot 0 for a FULL slot holding the given value.
 * Values are compared by reference (<tt>==</tt>), not with <tt>equals</tt>.
 *
 * @param value the value to be searched in the receiver.
 * @return the index where the value is contained in the receiver, returns -1 if the value was not found.
 */
protected int indexOfValue(Object value) {
	final Object[] vals = values;
	final byte[] states = state;

	int slot = states.length - 1;
	while (slot >= 0) {
		if (states[slot] == FULL && vals[slot] == value) return slot;
		slot--;
	}
	return -1; // not found
}
/**
 * Returns the first key the given value is associated with.
 * It is often a good idea to first check with {@link #containsValue(Object)} whether there exists an association from a key to this value.
 * Search order is guaranteed to be <i>identical</i> to the order used by method {@link #forEachKey(LongProcedure)}.
 * Only the first match is reported; further keys may be associated with the same value.
 *
 * @param value the value to search for.
 * @return the first key for which holds <tt>get(key) == value</tt>; 
 *		   returns <tt>Long.MIN_VALUE</tt> if no such key exists.
 */
public long keyOf(Object value) {
	final int slot = indexOfValue(value);
	return (slot < 0) ? Long.MIN_VALUE : table[slot];
}
/**
 * Fills all keys contained in the receiver into the specified list.
 * Fills the list, starting at index 0.
 * After this call returns the specified list has a new size that equals <tt>this.size()</tt>.
 * Iteration order is guaranteed to be <i>identical</i> to the order used by method {@link #forEachKey(LongProcedure)}.
 * <p>
 * This method can be used to iterate over the keys of the receiver.
 *
 * @param list the list to be filled, can have any size.
 */
public void keys(LongArrayList list) {
	list.setSize(distinct);
	final long[] target = list.elements(); // written to directly, after the resize above

	final long[] keySlots = table;
	final byte[] states = state;

	int next = 0; // next write position in the list
	int slot = keySlots.length;
	while (--slot >= 0) {
		if (states[slot] == FULL) {
			target[next] = keySlots[slot];
			next++;
		}
	}
}
/**
Fills all pairs satisfying a given condition into the specified lists.
Fills into the lists, starting at index 0.
After this call returns the specified lists both have a new size, the number of pairs satisfying the condition.
Iteration order is guaranteed to be <i>identical</i> to the order used by method {@link #forEachKey(LongProcedure)}.
<p>
<b>Example:</b>
<br>
<pre>
LongObjectProcedure condition = new LongObjectProcedure() { // match even keys only
	public boolean apply(long key, Object value) { return key%2==0; }
}
keys = (8,7,6), values = (1,2,2) --> keyList = (6,8), valueList = (2,1)
</pre>

@param condition    the condition to be matched. Takes the current key as first and the current value as second argument.
@param keyList the list to be filled with keys, can have any size.
@param valueList the list to be filled with values, can have any size.
*/
public void pairsMatching(final LongObjectProcedure condition, final LongArrayList keyList, final ObjectArrayList valueList) {
	keyList.clear();
	valueList.clear();

	int slot = table.length;
	while (--slot >= 0) {
		if (state[slot] != FULL) continue; // only live associations are offered to the condition
		if (!condition.apply(table[slot], values[slot])) continue;
		keyList.add(table[slot]);
		valueList.add(values[slot]);
	}
}
/**
 * Associates the given key with the given value.
 * Replaces any old <tt>(key,someOtherValue)</tt> association, if existing.
 * <p>
 * A new key may trigger a rehash twice: before insertion when the number of associations already exceeds
 * the high water mark, and after insertion when no FREE slot would be left.
 *
 * @param key the key the value shall be associated with.
 * @param value the value to be associated.
 * @return <tt>true</tt> if the receiver did not already contain such a key;
 *         <tt>false</tt> if the receiver did already contain such a key - the new value has now replaced the formerly associated value.
 */
public boolean put(long key, Object value) {
	final int slot = indexOfInsertion(key);
	if (slot < 0) {
		// key already contained at slot -slot-1: only the value changes
		this.values[-slot - 1] = value;
		return false;
	}

	if (this.distinct > this.highWaterMark) {
		// grow first, then start over because the insertion slot refers to the old table
		rehash(chooseGrowCapacity(this.distinct + 1, this.minLoadFactor, this.maxLoadFactor));
		return put(key, value);
	}

	// freeEntries counts FREE slots only; reusing a REMOVED slot leaves it unchanged
	if (this.state[slot] == FREE) {
		this.freeEntries--;
	}
	this.state[slot] = FULL;
	this.table[slot] = key;
	this.values[slot] = value;
	this.distinct++;

	if (this.freeEntries < 1) {
		// the probe loops of the lookup methods end only at a FREE slot or at the key, so keep one FREE slot
		rehash(chooseGrowCapacity(this.distinct + 1, this.minLoadFactor, this.maxLoadFactor));
	}

	return true;
}
/**
 * Rehashes the contents of the receiver into a new table
 * with a smaller or larger capacity.
 * This method is called automatically when the
 * number of keys in the receiver exceeds the high water mark or falls below the low water mark.
 * <p>
 * Only FULL slots are carried over, so the new table contains no REMOVED slots.
 * Both water marks are recomputed for the new capacity.
 *
 * @param newCapacity the number of slots of the new table.
 */
protected void rehash(int newCapacity) {
	final long[] previousKeys = table;
	final Object[] previousValues = values;
	final byte[] previousStates = state;
	final int previousCapacity = previousKeys.length;

	final long[] freshKeys = new long[newCapacity];
	final Object[] freshValues = new Object[newCapacity];
	final byte[] freshStates = new byte[newCapacity]; // all zero, i.e. all FREE

	this.lowWaterMark  = chooseLowWaterMark(newCapacity, this.minLoadFactor);
	this.highWaterMark = chooseHighWaterMark(newCapacity, this.maxLoadFactor);

	// install the new arrays before re-inserting: indexOfInsertion probes the receiver's current arrays
	this.table = freshKeys;
	this.values = freshValues;
	this.state = freshStates;
	this.freeEntries = newCapacity - this.distinct; // presumes distinct equals the number of FULL slots copied below

	int slot = previousCapacity;
	while (--slot >= 0) {
		if (previousStates[slot] != FULL) continue; // FREE and REMOVED slots are dropped
		final long key = previousKeys[slot];
		final int target = indexOfInsertion(key);
		freshKeys[target] = key;
		freshValues[target] = previousValues[slot];
		freshStates[target] = FULL;
	}
}
/**
 * Removes the given key with its associated element from the receiver, if present.
 * The slot is marked REMOVED rather than FREE, and its value reference is cleared.
 * The table is rehashed to a smaller capacity when the number of associations falls below the low water mark.
 *
 * @param key the key to be removed from the receiver.
 * @return <tt>true</tt> if the receiver contained the specified key, <tt>false</tt> otherwise.
 */
public boolean removeKey(long key) {
	final int slot = indexOfKey(key);
	if (slot < 0) return false; // key not contained

	this.values[slot] = null; // release the reference to the removed value
	this.state[slot] = REMOVED;
	this.distinct--;

	if (this.distinct < this.lowWaterMark) {
		rehash(chooseShrinkCapacity(this.distinct, this.minLoadFactor, this.maxLoadFactor));
	}

	return true;
}
/**
 * Initializes the receiver: delegates to the superclass <tt>setUp</tt>, allocates the key, value and state
 * arrays with <tt>nextPrime(initialCapacity)</tt> slots, and resets the counters and water marks.
 *
 * @param      initialCapacity   the initial capacity of the receiver.
 * @param      minLoadFactor        the minLoadFactor of the receiver.
 * @param      maxLoadFactor        the maxLoadFactor of the receiver.
 * @throws	IllegalArgumentException if <tt>initialCapacity &lt; 0 || (minLoadFactor &lt; 0.0 || minLoadFactor &gt;= 1.0) || (maxLoadFactor &lt;= 0.0 || maxLoadFactor &gt;= 1.0) || (minLoadFactor &gt;= maxLoadFactor)</tt>.
 */
protected void setUp(int initialCapacity, double minLoadFactor, double maxLoadFactor) {
	super.setUp(initialCapacity, minLoadFactor, maxLoadFactor);

	int capacity = nextPrime(initialCapacity);
	if (capacity == 0) capacity = 1; // open addressing needs at least one FREE slot at any time.

	this.table = new long[capacity];
	this.values = new Object[capacity];
	this.state = new byte[capacity]; // all zero, i.e. all FREE

	this.minLoadFactor = minLoadFactor;
	// At the largest prime the maximum load factor is forced to 1.0.
	// memory will be exhausted long before this pathological case happens, anyway.
	this.maxLoadFactor = (capacity == PrimeFinder.largestPrime) ? 1.0 : maxLoadFactor;

	this.distinct = 0;
	this.freeEntries = capacity;

	// lowWaterMark will be established upon first expansion.
	// establishing it now (upon instance construction) would immediately make the table shrink upon first put(...).
	// After all the idea of an "initialCapacity" implies violating lowWaterMarks when an object is young.
	// See ensureCapacity(...)
	this.lowWaterMark = 0;
	this.highWaterMark = chooseHighWaterMark(capacity, this.maxLoadFactor);
}
/**
 * Trims the capacity of the receiver to be the receiver's current 
 * size. Releases any superfluous internal memory. An application can use this operation to minimize the 
 * storage of the receiver.
 * <p>
 * The target capacity is <tt>nextPrime((int)(1 + 1.2*size()))</tt>; the table is rehashed only if that is
 * smaller than the current table length.
 */
public void trimToSize() {
	// * 1.2 because open addressing's performance exponentially degrades beyond that point
	// so that even rehashing the table can take very long
	final int wanted = (int) (1 + 1.2 * size());
	final int newCapacity = nextPrime(wanted);
	if (newCapacity < table.length) {
		rehash(newCapacity);
	}
}
/**
 * Fills all values contained in the receiver into the specified list.
 * Fills the list, starting at index 0.
 * After this call returns the specified list has a new size that equals <tt>this.size()</tt>.
 * Iteration order is guaranteed to be <i>identical</i> to the order used by method {@link #forEachKey(LongProcedure)}.
 * <p>
 * This method can be used to iterate over the values of the receiver.
 *
 * @param list the list to be filled, can have any size.
 */
public void values(ObjectArrayList list) {
	list.setSize(distinct);
	final Object[] target = list.elements(); // written to directly, after the resize above

	final Object[] valueSlots = values;
	final byte[] states = state;

	int next = 0; // next write position in the list
	int slot = states.length;
	while (--slot >= 0) {
		if (states[slot] == FULL) {
			target[next] = valueSlots[slot];
			next++;
		}
	}
}
}