001/*
002 * Copyright (C) 2007 The Guava Authors
003 *
004 * Licensed under the Apache License, Version 2.0 (the "License");
005 * you may not use this file except in compliance with the License.
006 * You may obtain a copy of the License at
007 *
008 * http://www.apache.org/licenses/LICENSE-2.0
009 *
010 * Unless required by applicable law or agreed to in writing, software
011 * distributed under the License is distributed on an "AS IS" BASIS,
012 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
013 * See the License for the specific language governing permissions and
014 * limitations under the License.
015 */
016
017package com.google.common.collect;
018
019import static com.google.common.base.Preconditions.checkArgument;
020import static com.google.common.base.Preconditions.checkNotNull;
021import static com.google.common.collect.CollectPreconditions.checkNonnegative;
022import static com.google.common.math.IntMath.sqrt;
023import static java.lang.Math.max;
024import static java.util.Objects.requireNonNull;
025
026import com.google.common.annotations.GwtCompatible;
027import com.google.common.annotations.GwtIncompatible;
028import com.google.common.annotations.J2ktIncompatible;
029import com.google.common.annotations.VisibleForTesting;
030import com.google.common.math.IntMath;
031import com.google.common.primitives.Ints;
032import com.google.errorprone.annotations.CanIgnoreReturnValue;
033import com.google.errorprone.annotations.concurrent.LazyInit;
034import com.google.j2objc.annotations.RetainedWith;
035import java.io.InvalidObjectException;
036import java.io.ObjectInputStream;
037import java.io.Serializable;
038import java.math.RoundingMode;
039import java.util.Arrays;
040import java.util.Collection;
041import java.util.Collections;
042import java.util.EnumSet;
043import java.util.Iterator;
044import java.util.Set;
045import java.util.SortedSet;
046import java.util.Spliterator;
047import java.util.function.Consumer;
048import java.util.stream.Collector;
049import org.jspecify.annotations.Nullable;
050
051/**
052 * A {@link Set} whose contents will never change, with many other important properties detailed at
053 * {@link ImmutableCollection}.
054 *
055 * @since 2.0
056 */
057@GwtCompatible(serializable = true, emulated = true)
058@SuppressWarnings("serial") // we're overriding default serialization
059public abstract class ImmutableSet<E> extends ImmutableCollection<E> implements Set<E> {
060  static final int SPLITERATOR_CHARACTERISTICS =
061      ImmutableCollection.SPLITERATOR_CHARACTERISTICS | Spliterator.DISTINCT;
062
063  /**
064   * Returns a {@code Collector} that accumulates the input elements into a new {@code
065   * ImmutableSet}. Elements appear in the resulting set in the encounter order of the stream; if
066   * the stream contains duplicates (according to {@link Object#equals(Object)}), only the first
067   * duplicate in encounter order will appear in the result.
068   *
069   * @since 21.0
070   */
071  public static <E> Collector<E, ?, ImmutableSet<E>> toImmutableSet() {
072    return CollectCollectors.toImmutableSet();
073  }
074
075  /**
076   * Returns the empty immutable set. Preferred over {@link Collections#emptySet} for code
077   * consistency, and because the return type conveys the immutability guarantee.
078   *
079   * <p><b>Performance note:</b> the instance returned is a singleton.
080   */
081  @SuppressWarnings({"unchecked"}) // fully variant implementation (never actually produces any Es)
082  public static <E> ImmutableSet<E> of() {
083    return (ImmutableSet<E>) RegularImmutableSet.EMPTY;
084  }
085
086  /**
087   * Returns an immutable set containing the given element. Preferred over {@link
088   * Collections#singleton} for code consistency, {@code null} rejection, and because the return
089   * type conveys the immutability guarantee.
090   */
091  public static <E> ImmutableSet<E> of(E e1) {
092    return new SingletonImmutableSet<>(e1);
093  }
094
095  /*
096   * TODO: b/315526394 - Skip the Builder entirely for the of(...) methods, since we don't need to
097   * worry that we might trigger the fallback to the JDK-backed implementation? (The varargs one
098   * _could_, so we could keep it as it is. Or we could convince ourselves that hash flooding is
099   * unlikely in practice there, too.)
100   */
101
102  /**
103   * Returns an immutable set containing the given elements, minus duplicates, in the order each was
104   * first specified. That is, if multiple elements are {@linkplain Object#equals equal}, all except
105   * the first are ignored.
106   */
107  public static <E> ImmutableSet<E> of(E e1, E e2) {
108    return new RegularSetBuilderImpl<E>(2).add(e1).add(e2).review().build();
109  }
110
111  /**
112   * Returns an immutable set containing the given elements, minus duplicates, in the order each was
113   * first specified. That is, if multiple elements are {@linkplain Object#equals equal}, all except
114   * the first are ignored.
115   */
116  public static <E> ImmutableSet<E> of(E e1, E e2, E e3) {
117    return new RegularSetBuilderImpl<E>(3).add(e1).add(e2).add(e3).review().build();
118  }
119
120  /**
121   * Returns an immutable set containing the given elements, minus duplicates, in the order each was
122   * first specified. That is, if multiple elements are {@linkplain Object#equals equal}, all except
123   * the first are ignored.
124   */
125  public static <E> ImmutableSet<E> of(E e1, E e2, E e3, E e4) {
126    return new RegularSetBuilderImpl<E>(4).add(e1).add(e2).add(e3).add(e4).review().build();
127  }
128
129  /**
130   * Returns an immutable set containing the given elements, minus duplicates, in the order each was
131   * first specified. That is, if multiple elements are {@linkplain Object#equals equal}, all except
132   * the first are ignored.
133   */
134  public static <E> ImmutableSet<E> of(E e1, E e2, E e3, E e4, E e5) {
135    return new RegularSetBuilderImpl<E>(5).add(e1).add(e2).add(e3).add(e4).add(e5).review().build();
136  }
137
138  /**
139   * Returns an immutable set containing the given elements, minus duplicates, in the order each was
140   * first specified. That is, if multiple elements are {@linkplain Object#equals equal}, all except
141   * the first are ignored.
142   *
143   * <p>The array {@code others} must not be longer than {@code Integer.MAX_VALUE - 6}.
144   *
145   * @since 3.0 (source-compatible since 2.0)
146   */
147  @SafeVarargs // For Eclipse. For internal javac we have disabled this pointless type of warning.
148  public static <E> ImmutableSet<E> of(E e1, E e2, E e3, E e4, E e5, E e6, E... others) {
149    checkArgument(
150        others.length <= Integer.MAX_VALUE - 6, "the total number of elements must fit in an int");
151    SetBuilderImpl<E> builder = new RegularSetBuilderImpl<>(6 + others.length);
152    builder = builder.add(e1).add(e2).add(e3).add(e4).add(e5).add(e6);
153    for (int i = 0; i < others.length; i++) {
154      builder = builder.add(others[i]);
155    }
156    return builder.review().build();
157  }
158
159  /**
160   * Returns an immutable set containing each of {@code elements}, minus duplicates, in the order
161   * each appears first in the source collection.
162   *
163   * <p><b>Performance note:</b> This method will sometimes recognize that the actual copy operation
164   * is unnecessary; for example, {@code copyOf(copyOf(anArrayList))} will copy the data only once.
165   * This reduces the expense of habitually making defensive copies at API boundaries. However, the
166   * precise conditions for skipping the copy operation are undefined.
167   *
168   * @throws NullPointerException if any of {@code elements} is null
169   * @since 7.0 (source-compatible since 2.0)
170   */
171  // This the best we could do to get copyOfEnumSet to compile in the mainline.
172  // The suppression also covers the cast to E[], discussed below.
173  // In the backport, we don't have those cases and thus don't need this suppression.
174  // We keep it to minimize diffs.
175  @SuppressWarnings("unchecked")
176  public static <E> ImmutableSet<E> copyOf(Collection<? extends E> elements) {
177    /*
178     * TODO(lowasser): consider checking for ImmutableAsList here
179     * TODO(lowasser): consider checking for Multiset here
180     */
181    // Don't refer to ImmutableSortedSet by name so it won't pull in all that code
182    if (elements instanceof ImmutableSet && !(elements instanceof SortedSet)) {
183      @SuppressWarnings("unchecked") // all supported methods are covariant
184      ImmutableSet<E> set = (ImmutableSet<E>) elements;
185      if (!set.isPartialView()) {
186        return set;
187      }
188    } else if (elements instanceof EnumSet) {
189      return copyOfEnumSet((EnumSet<?>) elements);
190    }
191
192    if (elements.isEmpty()) {
193      // We avoid allocating anything.
194      return of();
195    }
196    // Collection<E>.toArray() is required to contain only E instances, and all we do is read them.
197    // TODO(cpovirk): Consider using Object[] anyway.
198    E[] array = (E[]) elements.toArray();
199    /*
200     * For a Set, we guess that it contains no duplicates. That's just a guess for purpose of
201     * sizing; if the Set uses different equality semantics, it might contain duplicates according
202     * to equals(), and we will deduplicate those properly, albeit at some cost in allocations.
203     */
204    int expectedSize =
205        elements instanceof Set ? array.length : estimatedSizeForUnknownDuplication(array.length);
206    return fromArrayWithExpectedSize(array, expectedSize);
207  }
208
209  /**
210   * Returns an immutable set containing each of {@code elements}, minus duplicates, in the order
211   * each appears first in the source iterable. This method iterates over {@code elements} only
212   * once.
213   *
214   * <p><b>Performance note:</b> This method will sometimes recognize that the actual copy operation
215   * is unnecessary; for example, {@code copyOf(copyOf(anArrayList))} should copy the data only
216   * once. This reduces the expense of habitually making defensive copies at API boundaries.
217   * However, the precise conditions for skipping the copy operation are undefined.
218   *
219   * @throws NullPointerException if any of {@code elements} is null
220   */
221  public static <E> ImmutableSet<E> copyOf(Iterable<? extends E> elements) {
222    return (elements instanceof Collection)
223        ? copyOf((Collection<? extends E>) elements)
224        : copyOf(elements.iterator());
225  }
226
227  /**
228   * Returns an immutable set containing each of {@code elements}, minus duplicates, in the order
229   * each appears first in the source iterator.
230   *
231   * @throws NullPointerException if any of {@code elements} is null
232   */
233  public static <E> ImmutableSet<E> copyOf(Iterator<? extends E> elements) {
234    // We special-case for 0 or 1 elements, but anything further is madness.
235    if (!elements.hasNext()) {
236      return of();
237    }
238    E first = elements.next();
239    if (!elements.hasNext()) {
240      return of(first);
241    } else {
242      return new ImmutableSet.Builder<E>().add(first).addAll(elements).build();
243    }
244  }
245
246  /**
247   * Returns an immutable set containing each of {@code elements}, minus duplicates, in the order
248   * each appears first in the source array.
249   *
250   * @throws NullPointerException if any of {@code elements} is null
251   * @since 3.0
252   */
253  public static <E> ImmutableSet<E> copyOf(E[] elements) {
254    return fromArrayWithExpectedSize(elements, estimatedSizeForUnknownDuplication(elements.length));
255  }
256
257  private static <E> ImmutableSet<E> fromArrayWithExpectedSize(E[] elements, int expectedSize) {
258    switch (elements.length) {
259      case 0:
260        return of();
261      case 1:
262        return of(elements[0]);
263      default:
264        SetBuilderImpl<E> builder = new RegularSetBuilderImpl<>(expectedSize);
265        for (int i = 0; i < elements.length; i++) {
266          builder = builder.add(elements[i]);
267        }
268        return builder.review().build();
269    }
270  }
271
272  @SuppressWarnings({"rawtypes", "unchecked"}) // necessary to compile against Java 8
273  private static ImmutableSet copyOfEnumSet(EnumSet<?> enumSet) {
274    return ImmutableEnumSet.asImmutable(EnumSet.copyOf((EnumSet) enumSet));
275  }
276
277  ImmutableSet() {}
278
279  /** Returns {@code true} if the {@code hashCode()} method runs quickly. */
280  boolean isHashCodeFast() {
281    return false;
282  }
283
284  @Override
285  public boolean equals(@Nullable Object object) {
286    if (object == this) {
287      return true;
288    }
289    if (object instanceof ImmutableSet
290        && isHashCodeFast()
291        && ((ImmutableSet<?>) object).isHashCodeFast()
292        && hashCode() != object.hashCode()) {
293      return false;
294    }
295    return Sets.equalsImpl(this, object);
296  }
297
298  @Override
299  public int hashCode() {
300    return Sets.hashCodeImpl(this);
301  }
302
303  // This declaration is needed to make Set.iterator() and
304  // ImmutableCollection.iterator() consistent.
305  @Override
306  public abstract UnmodifiableIterator<E> iterator();
307
308  @GwtCompatible
309  abstract static class CachingAsList<E> extends ImmutableSet<E> {
310    @LazyInit @RetainedWith private transient @Nullable ImmutableList<E> asList;
311
312    @Override
313    public ImmutableList<E> asList() {
314      ImmutableList<E> result = asList;
315      if (result == null) {
316        return asList = createAsList();
317      } else {
318        return result;
319      }
320    }
321
322    ImmutableList<E> createAsList() {
323      return new RegularImmutableAsList<>(this, toArray());
324    }
325
326    // redeclare to help optimizers with b/310253115
327    @SuppressWarnings("RedundantOverride")
328    @Override
329    @J2ktIncompatible // serialization
330    @GwtIncompatible // serialization
331    Object writeReplace() {
332      return super.writeReplace();
333    }
334  }
335
336  abstract static class Indexed<E> extends CachingAsList<E> {
337    abstract E get(int index);
338
339    @Override
340    public UnmodifiableIterator<E> iterator() {
341      return asList().iterator();
342    }
343
344    @Override
345    public Spliterator<E> spliterator() {
346      return CollectSpliterators.indexed(size(), SPLITERATOR_CHARACTERISTICS, this::get);
347    }
348
349    @Override
350    public void forEach(Consumer<? super E> consumer) {
351      checkNotNull(consumer);
352      int n = size();
353      for (int i = 0; i < n; i++) {
354        consumer.accept(get(i));
355      }
356    }
357
358    @Override
359    int copyIntoArray(@Nullable Object[] dst, int offset) {
360      return asList().copyIntoArray(dst, offset);
361    }
362
363    @Override
364    ImmutableList<E> createAsList() {
365      return new ImmutableAsList<E>() {
366        @Override
367        public E get(int index) {
368          return Indexed.this.get(index);
369        }
370
371        @Override
372        Indexed<E> delegateCollection() {
373          return Indexed.this;
374        }
375
376        // redeclare to help optimizers with b/310253115
377        @SuppressWarnings("RedundantOverride")
378        @Override
379        @J2ktIncompatible // serialization
380        @GwtIncompatible // serialization
381        Object writeReplace() {
382          return super.writeReplace();
383        }
384      };
385    }
386
387    // redeclare to help optimizers with b/310253115
388    @SuppressWarnings("RedundantOverride")
389    @Override
390    @J2ktIncompatible // serialization
391    @GwtIncompatible // serialization
392    Object writeReplace() {
393      return super.writeReplace();
394    }
395  }
396
397  /*
398   * This class is used to serialize all ImmutableSet instances, except for
399   * ImmutableEnumSet/ImmutableSortedSet, regardless of implementation type. It
400   * captures their "logical contents" and they are reconstructed using public
401   * static factories. This is necessary to ensure that the existence of a
402   * particular implementation type is an implementation detail.
403   */
404  @J2ktIncompatible // serialization
405  private static class SerializedForm implements Serializable {
406    final Object[] elements;
407
408    SerializedForm(Object[] elements) {
409      this.elements = elements;
410    }
411
412    Object readResolve() {
413      return copyOf(elements);
414    }
415
416    private static final long serialVersionUID = 0;
417  }
418
419  @Override
420  @J2ktIncompatible // serialization
421  Object writeReplace() {
422    return new SerializedForm(toArray());
423  }
424
425  @J2ktIncompatible // serialization
426  private void readObject(ObjectInputStream stream) throws InvalidObjectException {
427    throw new InvalidObjectException("Use SerializedForm");
428  }
429
430  /**
431   * Returns a new builder. The generated builder is equivalent to the builder created by the {@link
432   * Builder} constructor.
433   */
434  public static <E> Builder<E> builder() {
435    return new Builder<>();
436  }
437
438  /**
439   * Returns a new builder, expecting the specified number of distinct elements to be added.
440   *
441   * <p>If {@code expectedSize} is exactly the number of distinct elements added to the builder
442   * before {@link Builder#build} is called, the builder is likely to perform better than an unsized
443   * {@link #builder()} would have.
444   *
445   * <p>It is not specified if any performance benefits apply if {@code expectedSize} is close to,
446   * but not exactly, the number of distinct elements added to the builder.
447   *
448   * @since 23.1
449   */
450  public static <E> Builder<E> builderWithExpectedSize(int expectedSize) {
451    checkNonnegative(expectedSize, "expectedSize");
452    return new Builder<>(expectedSize);
453  }
454
455  /**
456   * A builder for creating {@code ImmutableSet} instances. Example:
457   *
458   * <pre>{@code
459   * static final ImmutableSet<Color> GOOGLE_COLORS =
460   *     ImmutableSet.<Color>builder()
461   *         .addAll(WEBSAFE_COLORS)
462   *         .add(new Color(0, 191, 255))
463   *         .build();
464   * }</pre>
465   *
466   * <p>Elements appear in the resulting set in the same order they were first added to the builder.
467   *
468   * <p>Building does not change the state of the builder, so it is still possible to add more
469   * elements and to build again.
470   *
471   * @since 2.0
472   */
473  public static class Builder<E> extends ImmutableCollection.Builder<E> {
474    /*
475     * `impl` is null only for instances of the subclass, ImmutableSortedSet.Builder. That subclass
476     * overrides all the methods that access it here. Thus, all the methods here can safely assume
477     * that this field is non-null.
478     */
479    private @Nullable SetBuilderImpl<E> impl;
480    boolean forceCopy;
481
482    public Builder() {
483      this(0);
484    }
485
486    Builder(int capacity) {
487      if (capacity > 0) {
488        impl = new RegularSetBuilderImpl<>(capacity);
489      } else {
490        impl = EmptySetBuilderImpl.instance();
491      }
492    }
493
494    Builder(@SuppressWarnings("unused") boolean subclass) {
495      this.impl = null; // unused
496    }
497
498    @VisibleForTesting
499    void forceJdk() {
500      requireNonNull(impl); // see the comment on the field
501      this.impl = new JdkBackedSetBuilderImpl<>(impl);
502    }
503
504    final void copyIfNecessary() {
505      if (forceCopy) {
506        copy();
507        forceCopy = false;
508      }
509    }
510
511    void copy() {
512      requireNonNull(impl); // see the comment on the field
513      impl = impl.copy();
514    }
515
516    @Override
517    @CanIgnoreReturnValue
518    public Builder<E> add(E element) {
519      requireNonNull(impl); // see the comment on the field
520      checkNotNull(element);
521      copyIfNecessary();
522      impl = impl.add(element);
523      return this;
524    }
525
526    @Override
527    @CanIgnoreReturnValue
528    public Builder<E> add(E... elements) {
529      super.add(elements);
530      return this;
531    }
532
533    /**
534     * Adds each element of {@code elements} to the {@code ImmutableSet}, ignoring duplicate
535     * elements (only the first duplicate element is added).
536     *
537     * @param elements the elements to add
538     * @return this {@code Builder} object
539     * @throws NullPointerException if {@code elements} is null or contains a null element
540     */
541    @Override
542    @CanIgnoreReturnValue
543    public Builder<E> addAll(Iterable<? extends E> elements) {
544      super.addAll(elements);
545      return this;
546    }
547
548    @Override
549    @CanIgnoreReturnValue
550    public Builder<E> addAll(Iterator<? extends E> elements) {
551      super.addAll(elements);
552      return this;
553    }
554
555    @CanIgnoreReturnValue
556    Builder<E> combine(Builder<E> other) {
557      requireNonNull(impl);
558      requireNonNull(other.impl);
559      /*
560       * For discussion of requireNonNull, see the comment on the field.
561       *
562       * (And I don't believe there's any situation in which we call x.combine(y) when x is a plain
563       * ImmutableSet.Builder but y is an ImmutableSortedSet.Builder (or vice versa). Certainly
564       * ImmutableSortedSet.Builder.combine() is written as if its argument will never be a plain
565       * ImmutableSet.Builder: It casts immediately to ImmutableSortedSet.Builder.)
566       */
567      copyIfNecessary();
568      this.impl = this.impl.combine(other.impl);
569      return this;
570    }
571
572    @Override
573    public ImmutableSet<E> build() {
574      requireNonNull(impl); // see the comment on the field
575      forceCopy = true;
576      impl = impl.review();
577      return impl.build();
578    }
579  }
580
581  /** Swappable internal implementation of an ImmutableSet.Builder. */
582  private abstract static class SetBuilderImpl<E> {
583    // The first `distinct` elements are non-null.
584    // Since we can never access null elements, we don't mark this nullable.
585    E[] dedupedElements;
586    int distinct;
587
588    @SuppressWarnings("unchecked")
589    SetBuilderImpl(int expectedCapacity) {
590      this.dedupedElements = (E[]) new Object[expectedCapacity];
591      this.distinct = 0;
592    }
593
594    /** Initializes this SetBuilderImpl with a copy of the deduped elements array from toCopy. */
595    SetBuilderImpl(SetBuilderImpl<E> toCopy) {
596      this.dedupedElements = Arrays.copyOf(toCopy.dedupedElements, toCopy.dedupedElements.length);
597      this.distinct = toCopy.distinct;
598    }
599
600    /**
601     * Resizes internal data structures if necessary to store the specified number of distinct
602     * elements.
603     */
604    private void ensureCapacity(int minCapacity) {
605      if (minCapacity > dedupedElements.length) {
606        int newCapacity =
607            ImmutableCollection.Builder.expandedCapacity(dedupedElements.length, minCapacity);
608        dedupedElements = Arrays.copyOf(dedupedElements, newCapacity);
609      }
610    }
611
612    /** Adds e to the insertion-order array of deduplicated elements. Calls ensureCapacity. */
613    final void addDedupedElement(E e) {
614      ensureCapacity(distinct + 1);
615      dedupedElements[distinct++] = e;
616    }
617
618    /**
619     * Adds e to this SetBuilderImpl, returning the updated result. Only use the returned
620     * SetBuilderImpl, since we may switch implementations if e.g. hash flooding is detected.
621     */
622    abstract SetBuilderImpl<E> add(E e);
623
624    /** Adds all the elements from the specified SetBuilderImpl to this SetBuilderImpl. */
625    final SetBuilderImpl<E> combine(SetBuilderImpl<E> other) {
626      SetBuilderImpl<E> result = this;
627      for (int i = 0; i < other.distinct; i++) {
628        /*
629         * requireNonNull is safe because we ensure that the first `distinct` elements have been
630         * populated.
631         */
632        result = result.add(requireNonNull(other.dedupedElements[i]));
633      }
634      return result;
635    }
636
637    /**
638     * Creates a new copy of this SetBuilderImpl. Modifications to that SetBuilderImpl will not
639     * affect this SetBuilderImpl or sets constructed from this SetBuilderImpl via build().
640     */
641    abstract SetBuilderImpl<E> copy();
642
643    /**
644     * Call this before build(). Does a final check on the internal data structures, e.g. shrinking
645     * unnecessarily large structures or detecting previously unnoticed hash flooding.
646     */
647    SetBuilderImpl<E> review() {
648      return this;
649    }
650
651    abstract ImmutableSet<E> build();
652  }
653
654  private static final class EmptySetBuilderImpl<E> extends SetBuilderImpl<E> {
655    private static final EmptySetBuilderImpl<Object> INSTANCE = new EmptySetBuilderImpl<>();
656
657    @SuppressWarnings("unchecked")
658    static <E> SetBuilderImpl<E> instance() {
659      return (SetBuilderImpl<E>) INSTANCE;
660    }
661
662    private EmptySetBuilderImpl() {
663      super(0);
664    }
665
666    @Override
667    SetBuilderImpl<E> add(E e) {
668      return new RegularSetBuilderImpl<E>(Builder.DEFAULT_INITIAL_CAPACITY).add(e);
669    }
670
671    @Override
672    SetBuilderImpl<E> copy() {
673      return this;
674    }
675
676    @Override
677    ImmutableSet<E> build() {
678      return ImmutableSet.of();
679    }
680  }
681
682  // We use power-of-2 tables, and this is the highest int that's a power of 2
683  static final int MAX_TABLE_SIZE = Ints.MAX_POWER_OF_TWO;
684
685  // Represents how tightly we can pack things, as a maximum.
686  private static final double DESIRED_LOAD_FACTOR = 0.7;
687
688  // If the set has this many elements, it will "max out" the table size
689  private static final int CUTOFF = (int) (MAX_TABLE_SIZE * DESIRED_LOAD_FACTOR);
690
691  /**
692   * Returns an array size suitable for the backing array of a hash table that uses open addressing
693   * with linear probing in its implementation. The returned size is the smallest power of two that
694   * can hold setSize elements with the desired load factor. Always returns at least setSize + 2.
695   */
696  // TODO(cpovirk): Move to Hashing or something, since it's used elsewhere in the Android version.
697  static int chooseTableSize(int setSize) {
698    setSize = max(setSize, 2);
699    // Correct the size for open addressing to match desired load factor.
700    if (setSize < CUTOFF) {
701      // Round up to the next highest power of 2.
702      int tableSize = Integer.highestOneBit(setSize - 1) << 1;
703      while (tableSize * DESIRED_LOAD_FACTOR < setSize) {
704        tableSize <<= 1;
705      }
706      return tableSize;
707    }
708
709    // The table can't be completely full or we'll get infinite reprobes
710    checkArgument(setSize < MAX_TABLE_SIZE, "collection too large");
711    return MAX_TABLE_SIZE;
712  }
713
714  /**
715   * Default implementation of the guts of ImmutableSet.Builder, creating an open-addressed hash
716   * table and deduplicating elements as they come, so it only allocates O(max(distinct,
717   * expectedCapacity)) rather than O(calls to add).
718   *
719   * <p>This implementation attempts to detect hash flooding, and if it's identified, falls back to
720   * JdkBackedSetBuilderImpl.
721   */
722  private static final class RegularSetBuilderImpl<E> extends SetBuilderImpl<E> {
723    // null until at least two elements are present
724    private @Nullable Object @Nullable [] hashTable;
725    private int maxRunBeforeFallback;
726    private int expandTableThreshold;
727    private int hashCode;
728
729    RegularSetBuilderImpl(int expectedCapacity) {
730      super(expectedCapacity);
731      this.hashTable = null;
732      this.maxRunBeforeFallback = 0;
733      this.expandTableThreshold = 0;
734    }
735
736    RegularSetBuilderImpl(RegularSetBuilderImpl<E> toCopy) {
737      super(toCopy);
738      this.hashTable = (toCopy.hashTable == null) ? null : toCopy.hashTable.clone();
739      this.maxRunBeforeFallback = toCopy.maxRunBeforeFallback;
740      this.expandTableThreshold = toCopy.expandTableThreshold;
741      this.hashCode = toCopy.hashCode;
742    }
743
744    @Override
745    SetBuilderImpl<E> add(E e) {
746      checkNotNull(e);
747      if (hashTable == null) {
748        if (distinct == 0) {
749          addDedupedElement(e);
750          return this;
751        } else {
752          ensureTableCapacity(dedupedElements.length);
753          E elem = dedupedElements[0];
754          distinct--;
755          return insertInHashTable(elem).add(e);
756        }
757      }
758      return insertInHashTable(e);
759    }
760
761    private SetBuilderImpl<E> insertInHashTable(E e) {
762      requireNonNull(hashTable);
763      int eHash = e.hashCode();
764      int i0 = Hashing.smear(eHash);
765      int mask = hashTable.length - 1;
766      for (int i = i0; i - i0 < maxRunBeforeFallback; i++) {
767        int index = i & mask;
768        Object tableEntry = hashTable[index];
769        if (tableEntry == null) {
770          addDedupedElement(e);
771          hashTable[index] = e;
772          hashCode += eHash;
773          ensureTableCapacity(distinct); // rebuilds table if necessary
774          return this;
775        } else if (tableEntry.equals(e)) { // not a new element, ignore
776          return this;
777        }
778      }
779      // we fell out of the loop due to a long run; fall back to JDK impl
780      return new JdkBackedSetBuilderImpl<E>(this).add(e);
781    }
782
783    @Override
784    SetBuilderImpl<E> copy() {
785      return new RegularSetBuilderImpl<>(this);
786    }
787
788    @Override
789    SetBuilderImpl<E> review() {
790      if (hashTable == null) {
791        return this;
792      }
793      int targetTableSize = chooseTableSize(distinct);
794      if (targetTableSize * 2 < hashTable.length) {
795        hashTable = rebuildHashTable(targetTableSize, dedupedElements, distinct);
796        maxRunBeforeFallback = maxRunBeforeFallback(targetTableSize);
797        expandTableThreshold = (int) (DESIRED_LOAD_FACTOR * targetTableSize);
798      }
799      return hashFloodingDetected(hashTable) ? new JdkBackedSetBuilderImpl<E>(this) : this;
800    }
801
802    @Override
803    ImmutableSet<E> build() {
804      switch (distinct) {
805        case 0:
806          return of();
807        case 1:
808          /*
809           * requireNonNull is safe because we ensure that the first `distinct` elements have been
810           * populated.
811           */
812          return of(requireNonNull(dedupedElements[0]));
813        default:
814          /*
815           * The suppression is safe because we ensure that the first `distinct` elements have been
816           * populated.
817           */
818          @SuppressWarnings("nullness")
819          Object[] elements =
820              (distinct == dedupedElements.length)
821                  ? dedupedElements
822                  : Arrays.copyOf(dedupedElements, distinct);
823          return new RegularImmutableSet<>(
824              elements, hashCode, requireNonNull(hashTable), hashTable.length - 1);
825      }
826    }
827
828    /** Builds a new open-addressed hash table from the first n objects in elements. */
829    static @Nullable Object[] rebuildHashTable(int newTableSize, Object[] elements, int n) {
830      @Nullable Object[] hashTable = new @Nullable Object[newTableSize];
831      int mask = hashTable.length - 1;
832      for (int i = 0; i < n; i++) {
833        // requireNonNull is safe because we ensure that the first n elements have been populated.
834        Object e = requireNonNull(elements[i]);
835        int j0 = Hashing.smear(e.hashCode());
836        for (int j = j0; ; j++) {
837          int index = j & mask;
838          if (hashTable[index] == null) {
839            hashTable[index] = e;
840            break;
841          }
842        }
843      }
844      return hashTable;
845    }
846
847    void ensureTableCapacity(int minCapacity) {
848      int newTableSize;
849      if (hashTable == null) {
850        newTableSize = chooseTableSize(minCapacity);
851        hashTable = new Object[newTableSize];
852      } else if (minCapacity > expandTableThreshold && hashTable.length < MAX_TABLE_SIZE) {
853        newTableSize = hashTable.length * 2;
854        hashTable = rebuildHashTable(newTableSize, dedupedElements, distinct);
855      } else {
856        return;
857      }
858      maxRunBeforeFallback = maxRunBeforeFallback(newTableSize);
859      expandTableThreshold = (int) (DESIRED_LOAD_FACTOR * newTableSize);
860    }
861
862    /**
863     * We attempt to detect deliberate hash flooding attempts. If one is detected, we fall back to a
864     * wrapper around j.u.HashSet, which has built-in flooding protection. MAX_RUN_MULTIPLIER was
865     * determined experimentally to match our desired probability of false positives.
866     */
867    // NB: yes, this is surprisingly high, but that's what the experiments said was necessary
868    // Raising this number slows the worst-case contains behavior, speeds up hashFloodingDetected,
869    // and reduces the false-positive probability.
870    static final int MAX_RUN_MULTIPLIER = 13;
871
872    /**
873     * Checks the whole hash table for poor hash distribution. Takes O(n) in the worst case, O(n /
874     * log n) on average.
875     *
876     * <p>The online hash flooding detecting in RegularSetBuilderImpl.add can detect e.g. many
877     * exactly matching hash codes, which would cause construction to take O(n^2), but can't detect
878     * e.g. hash codes adversarially designed to go into ascending table locations, which keeps
879     * construction O(n) (as desired) but then can have O(n) queries later.
880     *
881     * <p>If this returns false, then no query can take more than O(log n).
882     *
883     * <p>Note that for a RegularImmutableSet with elements with truly random hash codes, contains
884     * operations take expected O(1) time but with high probability take O(log n) for at least some
885     * element. (https://en.wikipedia.org/wiki/Linear_probing#Analysis)
886     *
887     * <p>This method may return {@code true} even on truly random input, but {@code
888     * ImmutableSetTest} tests that the probability of that is low.
889     */
890    static boolean hashFloodingDetected(@Nullable Object[] hashTable) {
891      int maxRunBeforeFallback = maxRunBeforeFallback(hashTable.length);
892      int mask = hashTable.length - 1;
893
894      // Invariant: all elements at indices in [knownRunStart, knownRunEnd) are nonnull.
895      // If knownRunStart == knownRunEnd, this is vacuously true.
896      // When knownRunEnd exceeds hashTable.length, it "wraps", detecting runs around the end
897      // of the table.
898      int knownRunStart = 0;
899      int knownRunEnd = 0;
900
901      outerLoop:
902      while (knownRunStart < hashTable.length) {
903        if (knownRunStart == knownRunEnd && hashTable[knownRunStart] == null) {
904          if (hashTable[(knownRunStart + maxRunBeforeFallback - 1) & mask] == null) {
905            // There are only maxRunBeforeFallback - 1 elements between here and there,
906            // so even if they were all nonnull, we wouldn't detect a hash flood.  Therefore,
907            // we can skip them all.
908            knownRunStart += maxRunBeforeFallback;
909          } else {
910            knownRunStart++; // the only case in which maxRunEnd doesn't increase by mRBF
911            // happens about f * (1-f) for f = DESIRED_LOAD_FACTOR, so around 21% of the time
912          }
913          knownRunEnd = knownRunStart;
914        } else {
915          for (int j = knownRunStart + maxRunBeforeFallback - 1; j >= knownRunEnd; j--) {
916            if (hashTable[j & mask] == null) {
917              knownRunEnd = knownRunStart + maxRunBeforeFallback;
918              knownRunStart = j + 1;
919              continue outerLoop;
920            }
921          }
922          return true;
923        }
924      }
925      return false;
926    }
927
928    /**
929     * If more than this many consecutive positions are filled in a table of the specified size,
930     * report probable hash flooding. ({@link #hashFloodingDetected} may also report hash flooding
931     * if fewer consecutive positions are filled; see that method for details.)
932     */
933    static int maxRunBeforeFallback(int tableSize) {
934      return MAX_RUN_MULTIPLIER * IntMath.log2(tableSize, RoundingMode.UNNECESSARY);
935    }
936  }
937
938  /**
939   * SetBuilderImpl version that uses a JDK HashSet, which has built in hash flooding protection.
940   */
941  private static final class JdkBackedSetBuilderImpl<E> extends SetBuilderImpl<E> {
942    private final Set<Object> delegate;
943
944    JdkBackedSetBuilderImpl(SetBuilderImpl<E> toCopy) {
945      super(toCopy); // initializes dedupedElements and distinct
946      delegate = Sets.newHashSetWithExpectedSize(distinct);
947      for (int i = 0; i < distinct; i++) {
948        /*
949         * requireNonNull is safe because we ensure that the first `distinct` elements have been
950         * populated.
951         */
952        delegate.add(requireNonNull(dedupedElements[i]));
953      }
954    }
955
956    @Override
957    SetBuilderImpl<E> add(E e) {
958      checkNotNull(e);
959      if (delegate.add(e)) {
960        addDedupedElement(e);
961      }
962      return this;
963    }
964
965    @Override
966    SetBuilderImpl<E> copy() {
967      return new JdkBackedSetBuilderImpl<>(this);
968    }
969
970    @Override
971    ImmutableSet<E> build() {
972      switch (distinct) {
973        case 0:
974          return of();
975        case 1:
976          /*
977           * requireNonNull is safe because we ensure that the first `distinct` elements have been
978           * populated.
979           */
980          return of(requireNonNull(dedupedElements[0]));
981        default:
982          return new JdkBackedImmutableSet<>(
983              delegate, ImmutableList.asImmutableList(dedupedElements, distinct));
984      }
985    }
986  }
987
988  private static int estimatedSizeForUnknownDuplication(int inputElementsIncludingAnyDuplicates) {
989    if (inputElementsIncludingAnyDuplicates
990        < ImmutableCollection.Builder.DEFAULT_INITIAL_CAPACITY) {
991      return inputElementsIncludingAnyDuplicates;
992    }
993    // Guess the size is "halfway between" all duplicates and no duplicates, on a log scale.
994    return max(
995        ImmutableCollection.Builder.DEFAULT_INITIAL_CAPACITY,
996        sqrt(inputElementsIncludingAnyDuplicates, RoundingMode.CEILING));
997  }
998
999  private static final long serialVersionUID = 0xcafebabe;
1000}