Skip to content

Commit 3e39304

Browse files
XenoAmessStuart Marks
authored and
Stuart Marks
committedMar 16, 2022
8281631: HashMap copy constructor and putAll can over-allocate table
Reviewed-by: smarks
1 parent 0cf291b commit 3e39304

File tree

4 files changed

+258
-72
lines changed

4 files changed

+258
-72
lines changed
 

‎src/java.base/share/classes/java/util/HashMap.java

+7-7
Original file line numberDiff line numberDiff line change
@@ -495,9 +495,9 @@ final void putMapEntries(Map<? extends K, ? extends V> m, boolean evict) {
495495
int s = m.size();
496496
if (s > 0) {
497497
if (table == null) { // pre-size
498-
float ft = ((float)s / loadFactor) + 1.0F;
499-
int t = ((ft < (float)MAXIMUM_CAPACITY) ?
500-
(int)ft : MAXIMUM_CAPACITY);
498+
double dt = Math.ceil(s / (double)loadFactor);
499+
int t = ((dt < (double)MAXIMUM_CAPACITY) ?
500+
(int)dt : MAXIMUM_CAPACITY);
501501
if (t > threshold)
502502
threshold = tableSizeFor(t);
503503
} else {
@@ -1527,12 +1527,12 @@ private void readObject(ObjectInputStream s)
15271527
} else if (mappings == 0) {
15281528
// use defaults
15291529
} else if (mappings > 0) {
1530-
float fc = (float)mappings / lf + 1.0f;
1531-
int cap = ((fc < DEFAULT_INITIAL_CAPACITY) ?
1530+
double dc = Math.ceil(mappings / (double)lf);
1531+
int cap = ((dc < DEFAULT_INITIAL_CAPACITY) ?
15321532
DEFAULT_INITIAL_CAPACITY :
1533-
(fc >= MAXIMUM_CAPACITY) ?
1533+
(dc >= MAXIMUM_CAPACITY) ?
15341534
MAXIMUM_CAPACITY :
1535-
tableSizeFor((int)fc));
1535+
tableSizeFor((int)dc));
15361536
float ft = (float)cap * lf;
15371537
threshold = ((cap < MAXIMUM_CAPACITY && ft < MAXIMUM_CAPACITY) ?
15381538
(int)ft : Integer.MAX_VALUE);

‎src/java.base/share/classes/java/util/WeakHashMap.java

+4-6
Original file line numberDiff line numberDiff line change
@@ -213,9 +213,7 @@ public WeakHashMap(int initialCapacity, float loadFactor) {
213213
if (loadFactor <= 0 || Float.isNaN(loadFactor))
214214
throw new IllegalArgumentException("Illegal Load factor: "+
215215
loadFactor);
216-
int capacity = 1;
217-
while (capacity < initialCapacity)
218-
capacity <<= 1;
216+
int capacity = HashMap.tableSizeFor(initialCapacity);
219217
table = newTable(capacity);
220218
this.loadFactor = loadFactor;
221219
threshold = (int)(capacity * loadFactor);
@@ -251,7 +249,7 @@ public WeakHashMap() {
251249
* @since 1.3
252250
*/
253251
public WeakHashMap(Map<? extends K, ? extends V> m) {
254-
this(Math.max((int) ((float)m.size() / DEFAULT_LOAD_FACTOR + 1.0F),
252+
this(Math.max((int) Math.ceil(m.size() / (double)DEFAULT_LOAD_FACTOR),
255253
DEFAULT_INITIAL_CAPACITY),
256254
DEFAULT_LOAD_FACTOR);
257255
putAll(m);
@@ -468,7 +466,7 @@ public V put(K key, V value) {
468466
modCount++;
469467
Entry<K,V> e = tab[i];
470468
tab[i] = new Entry<>(k, value, queue, h, e);
471-
if (++size >= threshold)
469+
if (++size > threshold)
472470
resize(tab.length * 2);
473471
return null;
474472
}
@@ -557,7 +555,7 @@ public void putAll(Map<? extends K, ? extends V> m) {
557555
* to at most one extra resize.
558556
*/
559557
if (numKeysToBeAdded > threshold) {
560-
int targetCapacity = (int)(numKeysToBeAdded / loadFactor + 1);
558+
int targetCapacity = (int)Math.ceil(numKeysToBeAdded / (double)loadFactor);
561559
if (targetCapacity > MAXIMUM_CAPACITY)
562560
targetCapacity = MAXIMUM_CAPACITY;
563561
int newCapacity = table.length;

‎test/jdk/ProblemList.txt

+1
Original file line numberDiff line numberDiff line change
@@ -542,6 +542,7 @@ java/lang/invoke/LFCaching/LFMultiThreadCachingTest.java 8151492 generic-
542542
java/lang/invoke/LFCaching/LFGarbageCollectedTest.java 8078602 generic-all
543543
java/lang/invoke/lambda/LambdaFileEncodingSerialization.java 8249079 linux-x64
544544
java/lang/invoke/RicochetTest.java 8251969 generic-all
545+
java/lang/Enum/ConstantDirectoryOptimalCapacity.java 8282120 generic-all
545546

546547
############################################################################
547548

Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
/*
22
* Copyright (c) 2018, Red Hat, Inc. All rights reserved.
3+
* Copyright (c) 2022, Oracle and/or its affiliates. All rights reserved.
34
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
45
*
56
* This code is free software; you can redistribute it and/or modify it
@@ -21,113 +22,299 @@
2122
* questions.
2223
*/
2324

25+
import org.testng.annotations.DataProvider;
2426
import org.testng.annotations.Test;
2527

2628
import java.lang.invoke.MethodHandle;
2729
import java.lang.invoke.MethodHandles;
2830
import java.lang.invoke.MethodType;
2931
import java.lang.invoke.VarHandle;
32+
import java.util.AbstractMap;
33+
import java.util.AbstractSet;
34+
import java.util.ArrayList;
35+
import java.util.Arrays;
3036
import java.util.HashMap;
37+
import java.util.Iterator;
3138
import java.util.LinkedHashMap;
3239
import java.util.List;
3340
import java.util.Map;
34-
import java.util.concurrent.ThreadLocalRandom;
41+
import java.util.Set;
42+
import java.util.WeakHashMap;
43+
import java.util.function.Consumer;
3544
import java.util.function.Supplier;
36-
import java.util.stream.IntStream;
3745

38-
import static java.util.stream.Collectors.toMap;
3946
import static org.testng.Assert.assertEquals;
4047
import static org.testng.Assert.assertNull;
4148

4249
/*
4350
* @test
44-
* @bug 8210280
51+
* @bug 8210280 8281631
4552
* @modules java.base/java.util:open
46-
* @summary White box tests for HashMap internals around table resize
53+
* @summary White box tests for HashMap-related internals around table sizing
4754
* @run testng WhiteBoxResizeTest
48-
* @key randomness
4955
*/
5056
public class WhiteBoxResizeTest {
51-
final ThreadLocalRandom rnd = ThreadLocalRandom.current();
57+
5258
final MethodHandle TABLE_SIZE_FOR;
53-
final VarHandle THRESHOLD;
54-
final VarHandle TABLE;
59+
final VarHandle HM_TABLE;
60+
final VarHandle WHM_TABLE;
5561

5662
public WhiteBoxResizeTest() throws ReflectiveOperationException {
57-
Class<?> mClass = HashMap.class;
58-
String nodeClassName = mClass.getName() + "$Node";
59-
Class<?> nodeArrayClass = Class.forName("[L" + nodeClassName + ";");
60-
MethodHandles.Lookup lookup = MethodHandles.privateLookupIn(mClass, MethodHandles.lookup());
61-
TABLE = lookup.findVarHandle(mClass, "table", nodeArrayClass);
62-
this.TABLE_SIZE_FOR = lookup.findStatic(
63-
mClass, "tableSizeFor",
64-
MethodType.methodType(int.class, int.class));
65-
this.THRESHOLD = lookup.findVarHandle(mClass, "threshold", int.class);
63+
MethodHandles.Lookup hmlookup = MethodHandles.privateLookupIn(HashMap.class, MethodHandles.lookup());
64+
TABLE_SIZE_FOR = hmlookup.findStatic(
65+
HashMap.class, "tableSizeFor", MethodType.methodType(int.class, int.class));
66+
HM_TABLE = hmlookup.unreflectVarHandle(HashMap.class.getDeclaredField("table"));
67+
68+
MethodHandles.Lookup whmlookup = MethodHandles.privateLookupIn(WeakHashMap.class, MethodHandles.lookup());
69+
WHM_TABLE = whmlookup.unreflectVarHandle(WeakHashMap.class.getDeclaredField("table"));
6670
}
6771

72+
/*
73+
* utility methods
74+
*/
75+
6876
int tableSizeFor(int n) {
6977
try {
7078
return (int) TABLE_SIZE_FOR.invoke(n);
71-
} catch (Throwable t) { throw new AssertionError(t); }
79+
} catch (Throwable t) {
80+
throw new AssertionError(t);
81+
}
7282
}
7383

74-
Object[] table(HashMap map) {
84+
Object[] table(Map<?, ?> map) {
7585
try {
76-
return (Object[]) TABLE.get(map);
77-
} catch (Throwable t) { throw new AssertionError(t); }
86+
VarHandle vh = map instanceof WeakHashMap ? WHM_TABLE : HM_TABLE;
87+
return (Object[]) vh.get(map);
88+
} catch (Throwable t) {
89+
throw new AssertionError(t);
90+
}
7891
}
7992

80-
int capacity(HashMap map) {
93+
int capacity(Map<?, ?> map) {
8194
return table(map).length;
8295
}
8396

84-
@Test
85-
public void testTableSizeFor() {
86-
assertEquals(tableSizeFor(0), 1);
87-
assertEquals(tableSizeFor(1), 1);
88-
assertEquals(tableSizeFor(2), 2);
89-
assertEquals(tableSizeFor(3), 4);
90-
assertEquals(tableSizeFor(15), 16);
91-
assertEquals(tableSizeFor(16), 16);
92-
assertEquals(tableSizeFor(17), 32);
93-
int maxSize = 1 << 30;
94-
assertEquals(tableSizeFor(maxSize - 1), maxSize);
95-
assertEquals(tableSizeFor(maxSize), maxSize);
96-
assertEquals(tableSizeFor(maxSize + 1), maxSize);
97-
assertEquals(tableSizeFor(Integer.MAX_VALUE), maxSize);
97+
// creates a map with size mappings
98+
Map<String, String> makeMap(int size) {
99+
Map<String, String> map = new HashMap<>();
100+
putN(map, size);
101+
return map;
102+
}
103+
104+
// creates a "fake" map: size() returns the given size, but
105+
// the entrySet iterator returns only one entry
106+
Map<String, String> fakeMap(int size) {
107+
return new AbstractMap<>() {
108+
public Set<Map.Entry<String, String>> entrySet() {
109+
return new AbstractSet<Map.Entry<String, String>>() {
110+
public int size() {
111+
return size;
112+
}
113+
114+
public Iterator<Map.Entry<String, String>> iterator() {
115+
return Set.of(Map.entry("1", "1")).iterator();
116+
}
117+
};
118+
}
119+
};
120+
}
121+
122+
void putN(Map<String, String> map, int n) {
123+
for (int i = 0; i < n; i++) {
124+
String string = Integer.toString(i);
125+
map.put(string, string);
126+
}
127+
}
128+
129+
/*
130+
* tests of tableSizeFor
131+
*/
132+
133+
@DataProvider(name = "tableSizeFor")
134+
public Object[][] tableSizeForCases() {
135+
final int MAX = 1 << 30;
136+
return new Object[][] {
137+
// tableSizeFor(arg), expected
138+
{ 0, 1 },
139+
{ 1, 1 },
140+
{ 2, 2 },
141+
{ 3, 4 },
142+
{ 4, 4 },
143+
{ 5, 8 },
144+
{ 15, 16 },
145+
{ 16, 16 },
146+
{ 17, 32 },
147+
{ MAX-1, MAX },
148+
{ MAX, MAX },
149+
{ MAX+1, MAX },
150+
{ Integer.MAX_VALUE, MAX }
151+
};
152+
}
153+
154+
@Test(dataProvider = "tableSizeFor")
155+
public void tableSizeFor(int arg, int expected) {
156+
assertEquals(tableSizeFor(arg), expected);
98157
}
99158

100-
@Test
101-
public void capacityTestDefaultConstructor() {
102-
capacityTestDefaultConstructor(new HashMap<>());
103-
capacityTestDefaultConstructor(new LinkedHashMap<>());
159+
/*
160+
* tests for lazy table allocation
161+
*/
162+
163+
@DataProvider(name = "lazy")
164+
public Object[][] lazyTableAllocationCases() {
165+
return new Object[][]{
166+
{new HashMap<>()},
167+
// { new WeakHashMap<>() }, // WHM doesn't allocate lazily
168+
{new LinkedHashMap<>()}
169+
};
104170
}
105171

106-
void capacityTestDefaultConstructor(HashMap<Integer, Integer> map) {
172+
@Test(dataProvider = "lazy")
173+
public void lazyTableAllocation(Map<?, ?> map) {
107174
assertNull(table(map));
175+
}
108176

109-
map.put(1, 1);
110-
assertEquals(capacity(map), 16); // default initial capacity
177+
/*
178+
* tests for default capacity (no-arg constructor)
179+
*/
111180

112-
map.putAll(IntStream.range(0, 64).boxed().collect(toMap(i -> i, i -> i)));
113-
assertEquals(capacity(map), 128);
181+
@DataProvider(name = "defaultCapacity")
182+
public Object[][] defaultCapacityCases() {
183+
return new Supplier<?>[][]{
184+
{() -> new HashMap<>()},
185+
{() -> new LinkedHashMap<>()},
186+
{() -> new WeakHashMap<>()}
187+
};
114188
}
115189

116-
@Test
117-
public void capacityTestInitialCapacity() {
118-
int initialCapacity = rnd.nextInt(2, 128);
119-
List<Supplier<HashMap<Integer, Integer>>> suppliers = List.of(
120-
() -> new HashMap<>(initialCapacity),
121-
() -> new HashMap<>(initialCapacity, 0.75f),
122-
() -> new LinkedHashMap<>(initialCapacity),
123-
() -> new LinkedHashMap<>(initialCapacity, 0.75f));
190+
@Test(dataProvider = "defaultCapacity")
191+
public void defaultCapacity(Supplier<Map<String, String>> s) {
192+
Map<String, String> map = s.get();
193+
map.put("", "");
194+
assertEquals(capacity(map), 16);
195+
}
124196

125-
for (Supplier<HashMap<Integer, Integer>> supplier : suppliers) {
126-
HashMap<Integer, Integer> map = supplier.get();
127-
assertNull(table(map));
197+
/*
198+
* tests for requested capacity (int and int+float constructors)
199+
*/
128200

129-
map.put(1, 1);
130-
assertEquals(capacity(map), tableSizeFor(initialCapacity));
201+
@DataProvider(name = "requestedCapacity")
202+
public Iterator<Object[]> requestedCapacityCases() {
203+
ArrayList<Object[]> cases = new ArrayList<>();
204+
for (int i = 2; i < 128; i++) {
205+
int cap = i;
206+
cases.add(new Object[]{"rhm1", cap, (Supplier<Map<String, String>>) () -> new HashMap<>(cap)});
207+
cases.add(new Object[]{"rhm2", cap, (Supplier<Map<String, String>>) () -> new HashMap<>(cap, 0.75f)});
208+
cases.add(new Object[]{"rlm1", cap, (Supplier<Map<String, String>>) () -> new LinkedHashMap<>(cap)});
209+
cases.add(new Object[]{"rlm2", cap, (Supplier<Map<String, String>>) () -> new LinkedHashMap<>(cap, 0.75f)});
210+
cases.add(new Object[]{"rwm1", cap, (Supplier<Map<String, String>>) () -> new WeakHashMap<>(cap)});
211+
cases.add(new Object[]{"rwm2", cap, (Supplier<Map<String, String>>) () -> new WeakHashMap<>(cap, 0.75f)});
131212
}
213+
return cases.iterator();
214+
}
215+
216+
@Test(dataProvider = "requestedCapacity")
217+
public void requestedCapacity(String label, int cap, Supplier<Map<String, String>> s) {
218+
Map<String, String> map = s.get();
219+
map.put("", "");
220+
assertEquals(capacity(map), tableSizeFor(cap));
221+
}
222+
223+
/*
224+
* Tests for capacity after map is populated with a given number N of mappings.
225+
* Maps are populated using a copy constructor on a map with N mappings,
226+
* other constructors followed by N put() calls, and other constructors followed
227+
* by putAll() on a map with N mappings.
228+
*
229+
* String labels encode the test case for ease of diagnosis if one of the test cases fails.
230+
* For example, "plm2pn" is "populated LinkedHashMap, 2-arg constructor, followed by putN".
231+
*/
232+
233+
// helper method for one populated capacity case, to provide target types for lambdas
234+
Object[] pcc(String label,
235+
int size,
236+
int expectedCapacity,
237+
Supplier<Map<String, String>> supplier,
238+
Consumer<Map<String, String>> consumer) {
239+
return new Object[]{label, size, expectedCapacity, supplier, consumer};
240+
}
241+
242+
List<Object[]> genPopulatedCapacityCases(int size, int cap) {
243+
return Arrays.asList(
244+
pcc("phmcpy", size, cap, () -> new HashMap<>(makeMap(size)), map -> { }),
245+
pcc("phm0pn", size, cap, () -> new HashMap<>(), map -> { putN(map, size); }),
246+
pcc("phm1pn", size, cap, () -> new HashMap<>(cap), map -> { putN(map, size); }),
247+
pcc("phm2pn", size, cap, () -> new HashMap<>(cap, 0.75f), map -> { putN(map, size); }),
248+
pcc("phm0pa", size, cap, () -> new HashMap<>(), map -> { map.putAll(makeMap(size)); }),
249+
pcc("phm1pa", size, cap, () -> new HashMap<>(cap), map -> { map.putAll(makeMap(size)); }),
250+
pcc("phm2pa", size, cap, () -> new HashMap<>(cap, 0.75f), map -> { map.putAll(makeMap(size)); }),
251+
252+
pcc("plmcpy", size, cap, () -> new LinkedHashMap<>(makeMap(size)), map -> { }),
253+
pcc("plm0pn", size, cap, () -> new LinkedHashMap<>(), map -> { putN(map, size); }),
254+
pcc("plm1pn", size, cap, () -> new LinkedHashMap<>(cap), map -> { putN(map, size); }),
255+
pcc("plm2pn", size, cap, () -> new LinkedHashMap<>(cap, 0.75f), map -> { putN(map, size); }),
256+
pcc("plm0pa", size, cap, () -> new LinkedHashMap<>(), map -> { map.putAll(makeMap(size)); }),
257+
pcc("plm1pa", size, cap, () -> new LinkedHashMap<>(cap), map -> { map.putAll(makeMap(size)); }),
258+
pcc("plm2pa", size, cap, () -> new LinkedHashMap<>(cap, 0.75f), map -> { map.putAll(makeMap(size)); }),
259+
260+
pcc("pwmcpy", size, cap, () -> new WeakHashMap<>(makeMap(size)), map -> { }),
261+
pcc("pwm0pn", size, cap, () -> new WeakHashMap<>(), map -> { putN(map, size); }),
262+
pcc("pwm1pn", size, cap, () -> new WeakHashMap<>(cap), map -> { putN(map, size); }),
263+
pcc("pwm2pn", size, cap, () -> new WeakHashMap<>(cap, 0.75f), map -> { putN(map, size); }),
264+
pcc("pwm0pa", size, cap, () -> new WeakHashMap<>(), map -> { map.putAll(makeMap(size)); }),
265+
pcc("pwm1pa", size, cap, () -> new WeakHashMap<>(cap), map -> { map.putAll(makeMap(size)); }),
266+
pcc("pwm2pa", size, cap, () -> new WeakHashMap<>(cap, 0.75f), map -> { map.putAll(makeMap(size)); })
267+
);
268+
}
269+
270+
List<Object[]> genFakePopulatedCapacityCases(int size, int cap) {
271+
return Arrays.asList(
272+
pcc("fhmcpy", size, cap, () -> new HashMap<>(fakeMap(size)), map -> { }),
273+
pcc("fhm0pa", size, cap, () -> new HashMap<>(), map -> { map.putAll(fakeMap(size)); }),
274+
pcc("fhm1pa", size, cap, () -> new HashMap<>(cap), map -> { map.putAll(fakeMap(size)); }),
275+
pcc("fhm2pa", size, cap, () -> new HashMap<>(cap, 0.75f), map -> { map.putAll(fakeMap(size)); }),
276+
277+
pcc("flmcpy", size, cap, () -> new LinkedHashMap<>(fakeMap(size)), map -> { }),
278+
pcc("flm0pa", size, cap, () -> new LinkedHashMap<>(), map -> { map.putAll(fakeMap(size)); }),
279+
pcc("flm1pa", size, cap, () -> new LinkedHashMap<>(cap), map -> { map.putAll(fakeMap(size)); }),
280+
pcc("flm2pa", size, cap, () -> new LinkedHashMap<>(cap, 0.75f), map -> { map.putAll(fakeMap(size)); }),
281+
282+
pcc("fwmcpy", size, cap, () -> new WeakHashMap<>(fakeMap(size)), map -> { }),
283+
// pcc("fwm0pa", size, cap, () -> new WeakHashMap<>(), map -> { map.putAll(fakeMap(size)); }), // see note
284+
pcc("fwm1pa", size, cap, () -> new WeakHashMap<>(cap), map -> { map.putAll(fakeMap(size)); }),
285+
pcc("fwm2pa", size, cap, () -> new WeakHashMap<>(cap, 0.75f), map -> { map.putAll(fakeMap(size)); })
286+
);
287+
288+
// Test case "fwm0pa" is commented out because WeakHashMap uses a different allocation
289+
// policy from the other map implementations: it deliberately under-allocates in this case.
290+
}
291+
292+
@DataProvider(name = "populatedCapacity")
293+
public Iterator<Object[]> populatedCapacityCases() {
294+
ArrayList<Object[]> cases = new ArrayList<>();
295+
cases.addAll(genPopulatedCapacityCases(11, 16));
296+
cases.addAll(genPopulatedCapacityCases(12, 16));
297+
cases.addAll(genPopulatedCapacityCases(13, 32));
298+
cases.addAll(genPopulatedCapacityCases(64, 128));
299+
300+
// numbers in this range are truncated by a float computation with 0.75f
301+
// but can get an exact result with a double computation with 0.75d
302+
cases.addAll(genFakePopulatedCapacityCases(25165824, 33554432));
303+
cases.addAll(genFakePopulatedCapacityCases(25165825, 67108864));
304+
cases.addAll(genFakePopulatedCapacityCases(25165826, 67108864));
305+
306+
return cases.iterator();
132307
}
308+
309+
@Test(dataProvider = "populatedCapacity")
310+
public void populatedCapacity(String label, // unused, included for diagnostics
311+
int size, // unused, included for diagnostics
312+
int expectedCapacity,
313+
Supplier<Map<String, String>> s,
314+
Consumer<Map<String, String>> c) {
315+
Map<String, String> map = s.get();
316+
c.accept(map);
317+
assertEquals(capacity(map), expectedCapacity);
318+
}
319+
133320
}

1 commit comments

Comments
 (1)

openjdk-notifier[bot] commented on Mar 16, 2022

@openjdk-notifier[bot]
Please sign in to comment.