/* Copyright (c) 2003-2006 Niels Kokholm and Peter Sestoft Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ #define LINEARPROBINGnot #define REFBUCKET #define SHRINKnot #define INTERHASHINGnot #define RANDOMINTERHASHING using System; using System.Diagnostics; using SCG = System.Collections.Generic; namespace C5 { /// /// A set collection class based on linear hashing /// [Serializable] public class HashSet : CollectionBase, ICollection { #region Feature /// /// Enum class to assist printing of compilation alternatives. /// [Flags] public enum Feature : short { /// /// Nothing /// Dummy = 0, /// /// Buckets are of reference type /// RefTypeBucket = 1, /// /// Primary buckets are of value type /// ValueTypeBucket = 2, /// /// Using linear probing to resolve index clashes /// LinearProbing = 4, /// /// Shrink table when very sparsely filled /// ShrinkTable = 8, /// /// Use chaining to resolve index clashes /// Chaining = 16, /// /// Use hash function on item hash code /// InterHashing = 32, /// /// Use a universal family of hash functions on item hash code /// RandomInterHashing = 64 } static Feature features = Feature.Dummy #if REFBUCKET | Feature.RefTypeBucket #else | Feature.ValueTypeBucket #endif #if SHRINK | Feature.ShrinkTable #endif #if LINEARPROBING | Feature.LinearProbing #else | Feature.Chaining #endif #if INTERHASHING | Feature.InterHashing #elif RANDOMINTERHASHING | Feature.RandomInterHashing #endif ; /// /// Show which implementation features was chosen at compilation time /// public static Feature Features { get { return features; } } #endregion #region Fields int indexmask, bits, bitsc, origbits, lastchosen; //bitsc==32-bits; indexmask==(1< /// /// /// public override EventTypeEnum ListenableEvents { get { return EventTypeEnum.Basic; } } #endregion #region Bucket nested class(es) #if REFBUCKET [Serializable] class Bucket { internal T item; internal int hashval; //Cache! #if LINEARPROBING internal Bucket(T item, int hashval) { this.item = item; this.hashval = hashval; } #else internal Bucket overflow; internal Bucket(T item, int hashval, Bucket overflow) { this.item = item; this.hashval = hashval; this.overflow = overflow; } #endif } #else struct Bucket { internal T item; internal int hashval; //Cache! #if LINEARPROBING internal Bucket(T item, int hashval) { this.item = item; this.hashval = hashval; } #else internal OverflowBucket overflow; internal Bucket(T item, int hashval) { this.item = item; this.hashval = hashval; this.overflow = default(OverflowBucket); } #endif } #if !LINEARPROBING class OverflowBucket { internal T item; internal int hashval; //Cache! internal OverflowBucket overflow; internal OverflowBucket(T item, int hashval, OverflowBucket overflow) { this.item = item; this.hashval = hashval; this.overflow = overflow; } } #endif #endif #endregion #region Basic Util bool equals(T i1, T i2) { return itemequalityComparer.Equals(i1, i2); } #if !REFBUCKET bool isnull(T item) { return itemequalityComparer.Equals(item, default(T)); } #endif int gethashcode(T item) { return itemequalityComparer.GetHashCode(item); } int hv2i(int hashval) { #if INTERHASHING //Note: *inverse mod 2^32 is -1503427877 return (int)(((uint)hashval * 1529784659) >>bitsc); #elif RANDOMINTERHASHING return (int)(((uint)hashval * randomhashfactor) >> bitsc); #else return indexmask & hashval; #endif } void expand() { //Console.WriteLine(String.Format("Expand to {0} bits", bits+1)); resize(bits + 1); } void shrink() { if (bits > 3) { //Console.WriteLine(String.Format("Shrink to {0} bits", bits - 1)); resize(bits - 1); } } void resize(int bits) { //Console.WriteLine(String.Format("Resize to {0} bits", bits)); this.bits = bits; bitsc = 32 - bits; indexmask = (1 << bits) - 1; Bucket[] newtable = new Bucket[indexmask + 1]; for (int i = 0, s = table.Length; i < s; i++) { Bucket b = table[i]; #if LINEARPROBING #if REFBUCKET if (b != null) { int j = hv2i(b.hashval); while (newtable[j] != null) { j = indexmask & (j + 1); } newtable[j] = b; } #else if (!isnull(b.item)) { int j = hv2i(b.hashval); while (!isnull(newtable[j].item)) { j = indexmask & (j + 1); } newtable[j] = b; } #endif #else #if REFBUCKET while (b != null) { int j = hv2i(b.hashval); newtable[j] = new Bucket(b.item, b.hashval, newtable[j]); b = b.overflow; } #else if (!isnull(b.item)) { insert(b.item, b.hashval, newtable); OverflowBucket ob = b.overflow; while (ob != null) { insert(ob.item, ob.hashval, newtable); ob = ob.overflow; } } #endif #endif } table = newtable; resizethreshhold = (int)(table.Length * fillfactor); //Console.WriteLine(String.Format("Resize to {0} bits done", bits)); } #if REFBUCKET #else #if LINEARPROBING #else //Only for resize!!! private void insert(T item, int hashval, Bucket[] t) { int i = hv2i(hashval); Bucket b = t[i]; if (!isnull(b.item)) { t[i].overflow = new OverflowBucket(item, hashval, b.overflow); } else t[i] = new Bucket(item, hashval); } #endif #endif /// /// Search for an item equal (according to itemequalityComparer) to the supplied item. /// /// /// If true, add item to table if not found. /// If true, update table entry if item found. /// If true raise events /// True if found private bool searchoradd(ref T item, bool add, bool update, bool raise) { #if LINEARPROBING #if REFBUCKET int hashval = gethashcode(item); int i = hv2i(hashval); Bucket b = table[i]; while (b != null) { T olditem = b.item; if (equals(olditem, item)) { if (update) b.item = item; else item = olditem; if (raise && update) raiseForUpdate(item, olditem); return true; } b = table[i = indexmask & (i + 1)]; } if (!add) goto notfound; table[i] = new Bucket(item, hashval); #else if (isnull(item)) { if (defaultvalid) { T olditem = defaultitem; if (update) defaultitem = item; else item = defaultitem; if (raise && update) raiseForUpdate(item, olditem); return true; } if (!add) goto notfound; defaultvalid = true; defaultitem = item; } else { int hashval = gethashcode(item); int i = hv2i(hashval); T t = table[i].item; while (!isnull(t)) { if (equals(t, item)) { if (update) table[i].item = item; else item = t; if (raise && update) raiseForUpdate(item, t); return true; } t = table[i = indexmask & (i + 1)].item; } if (!add) goto notfound; table[i] = new Bucket(item, hashval); } #endif #else #if REFBUCKET int hashval = gethashcode(item); int i = hv2i(hashval); Bucket b = table[i], bold = null; if (b != null) { while (b != null) { T olditem = b.item; if (equals(olditem, item)) { if (update) { b.item = item; } if (raise && update) raiseForUpdate(item, olditem); // bug20071112: item = olditem; return true; } bold = b; b = b.overflow; } if (!add) goto notfound; bold.overflow = new Bucket(item, hashval, null); } else { if (!add) goto notfound; table[i] = new Bucket(item, hashval, null); } #else if (isnull(item)) { if (defaultvalid) { T olditem = defaultitem; if (update) defaultitem = item; else item = defaultitem; if (raise && update) raiseForUpdate(item, olditem); return true; } if (!add) goto notfound; defaultvalid = true; defaultitem = item; } else { int hashval = gethashcode(item); int i = hv2i(hashval); Bucket b = table[i]; if (!isnull(b.item)) { if (equals(b.item, item)) { if (update) table[i].item = item; else item = b.item; if (raise && update) raiseForUpdate(item, b.item); return true; } OverflowBucket ob = table[i].overflow; if (ob == null) { if (!add) goto notfound; table[i].overflow = new OverflowBucket(item, hashval, null); } else { T olditem = ob.item; while (ob.overflow != null) { if (equals(item, olditem)) { if (update) ob.item = item; else item = olditem; if (raise && update) raiseForUpdate(item, olditem); return true; } ob = ob.overflow; olditem = ob.item; } if (equals(item, olditem)) { if (update) ob.item = item; else item = olditem; if (raise && update) raiseForUpdate(item, olditem); return true; } if (!add) goto notfound; ob.overflow = new OverflowBucket(item, hashval, null); } } else { if (!add) goto notfound; table[i] = new Bucket(item, hashval); } } #endif #endif size++; if (size > resizethreshhold) expand(); notfound: if (raise && add) raiseForAdd(item); if (update) item = default(T); return false; } private bool remove(ref T item) { if (size == 0) return false; #if LINEARPROBING #if REFBUCKET int hashval = gethashcode(item); int index = hv2i(hashval); Bucket b = table[index]; while (b != null) { if (equals(item, b.item)) { //ref item = table[index].item; table[index] = null; //Algorithm R int j = (index + 1) & indexmask; b = table[j]; while (b != null) { int k = hv2i(b.hashval); if ((k <= index && index < j) || (index < j && j < k) || (j < k && k <= index)) //if (index > j ? (j < k && k <= index): (k <= index || j < k) ) { table[index] = b; table[j] = null; index = j; } j = (j + 1) & indexmask; b = table[j]; } goto found; } b = table[index = indexmask & (index + 1)]; } return false; #else if (isnull(item)) { if (!defaultvalid) return false; //ref item = defaultitem; defaultvalid = false; defaultitem = default(T); //No spaceleaks! } else { int hashval = gethashcode(item); int index = hv2i(hashval); T t = table[index].item; while (!isnull(t)) { if (equals(item, t)) { //ref item = table[index].item; table[index].item = default(T); //algorithm R int j = (index + 1) & indexmask; Bucket b = table[j]; while (!isnull(b.item)) { int k = hv2i(b.hashval); if ((k <= index && index < j) || (index < j && j < k) || (j < k && k <= index)) { table[index] = b; table[j].item = default(T); index = j; } j = (j + 1) & indexmask; b = table[j]; } goto found; } t = table[index = indexmask & (index + 1)].item; } return false; } #endif found: #else #if REFBUCKET int hashval = gethashcode(item); int index = hv2i(hashval); Bucket b = table[index], bold; if (b == null) return false; if (equals(item, b.item)) { //ref item = b.item; table[index] = b.overflow; } else { bold = b; b = b.overflow; while (b != null && !equals(item, b.item)) { bold = b; b = b.overflow; } if (b == null) return false; //ref item = b.item; bold.overflow = b.overflow; } #else if (isnull(item)) { if (!defaultvalid) return false; //ref item = defaultitem; defaultvalid = false; defaultitem = default(T); //No spaceleaks! } else { int hashval = gethashcode(item); int index = hv2i(hashval); Bucket b = table[index]; OverflowBucket ob = b.overflow; if (equals(item, b.item)) { //ref item = b.item; if (ob == null) { table[index] = new Bucket(); } else { b = new Bucket(ob.item, ob.hashval); b.overflow = ob.overflow; table[index] = b; } } else { if (ob == null) return false; if (equals(item, ob.item)) { //ref item=ob.item; table[index].overflow = ob.overflow; } else { while (ob.overflow != null) if (equals(item, ob.overflow.item)) { //ref item = ob.overflow.item; break; } else ob = ob.overflow; if (ob.overflow == null) return false; ob.overflow = ob.overflow.overflow; } } } #endif #endif size--; return true; } private void clear() { bits = origbits; bitsc = 32 - bits; indexmask = (1 << bits) - 1; size = 0; table = new Bucket[indexmask + 1]; resizethreshhold = (int)(table.Length * fillfactor); #if !REFBUCKET defaultitem = default(T); defaultvalid = false; #endif } #endregion #region Constructors /// /// Create a hash set with natural item equalityComparer and default fill threshold (66%) /// and initial table size (16). /// public HashSet() : this(EqualityComparer.Default) { } /// /// Create a hash set with external item equalityComparer and default fill threshold (66%) /// and initial table size (16). /// /// The external item equalityComparer public HashSet(SCG.IEqualityComparer itemequalityComparer) : this(16, itemequalityComparer) { } /// /// Create a hash set with external item equalityComparer and default fill threshold (66%) /// /// Initial table size (rounded to power of 2, at least 16) /// The external item equalityComparer public HashSet(int capacity, SCG.IEqualityComparer itemequalityComparer) : this(capacity, 0.66, itemequalityComparer) { } /// /// Create a hash set with external item equalityComparer. /// /// Initial table size (rounded to power of 2, at least 16) /// Fill threshold (in range 10% to 90%) /// The external item equalityComparer public HashSet(int capacity, double fill, SCG.IEqualityComparer itemequalityComparer) : base(itemequalityComparer) { if (fill < 0.1 || fill > 0.9) throw new ArgumentException("Fill outside valid range [0.1, 0.9]"); if (capacity <= 0) throw new ArgumentException("Capacity must be non-negative"); //this.itemequalityComparer = itemequalityComparer; origbits = 4; while (capacity - 1 >> origbits > 0) origbits++; clear(); } #endregion #region IEditableCollection Members /// /// The complexity of the Contains operation /// /// Always returns Speed.Constant [Tested] public virtual Speed ContainsSpeed { [Tested]get { return Speed.Constant; } } /// /// Check if an item is in the set /// /// The item to look for /// True if set contains item [Tested] public virtual bool Contains(T item) { return searchoradd(ref item, false, false, false); } /// /// Check if an item (collection equal to a given one) is in the set and /// if so report the actual item object found. /// /// On entry, the item to look for. /// On exit the item found, if any /// True if set contains item [Tested] public virtual bool Find(ref T item) { return searchoradd(ref item, false, false, false); } /// /// Check if an item (collection equal to a given one) is in the set and /// if so replace the item object in the set with the supplied one. /// /// The item object to update with /// True if item was found (and updated) [Tested] public virtual bool Update(T item) { updatecheck(); return searchoradd(ref item, false, true, true); } /// /// Check if an item (collection equal to a given one) is in the set and /// if so replace the item object in the set with the supplied one. /// /// The item object to update with /// /// True if item was found (and updated) public virtual bool Update(T item, out T olditem) { updatecheck(); olditem = item; return searchoradd(ref olditem, false, true, true); } /// /// Check if an item (collection equal to a given one) is in the set. /// If found, report the actual item object in the set, /// else add the supplied one. /// /// On entry, the item to look for or add. /// On exit the actual object found, if any. /// True if item was found [Tested] public virtual bool FindOrAdd(ref T item) { updatecheck(); return searchoradd(ref item, true, false, true); } /// /// Check if an item (collection equal to a supplied one) is in the set and /// if so replace the item object in the set with the supplied one; else /// add the supplied one. /// /// The item to look for and update or add /// True if item was updated [Tested] public virtual bool UpdateOrAdd(T item) { updatecheck(); return searchoradd(ref item, true, true, true); } /// /// Check if an item (collection equal to a supplied one) is in the set and /// if so replace the item object in the set with the supplied one; else /// add the supplied one. /// /// The item to look for and update or add /// /// True if item was updated public virtual bool UpdateOrAdd(T item, out T olditem) { updatecheck(); olditem = item; return searchoradd(ref olditem, true, true, true); } /// /// Remove an item from the set /// /// The item to remove /// True if item was (found and) removed [Tested] public virtual bool Remove(T item) { updatecheck(); if (remove(ref item)) { #if SHRINK if (size8) shrink(); #endif raiseForRemove(item); return true; } else return false; } /// /// Remove an item from the set, reporting the actual matching item object. /// /// The value to remove. /// The removed value. /// True if item was found. [Tested] public virtual bool Remove(T item, out T removeditem) { updatecheck(); removeditem = item; if (remove(ref removeditem)) { #if SHRINK if (size8) shrink(); #endif raiseForRemove(removeditem); return true; } else return false; } /// /// Remove all items in a supplied collection from this set. /// /// /// The items to remove. [Tested] public virtual void RemoveAll(SCG.IEnumerable items) where U : T { updatecheck(); RaiseForRemoveAllHandler raiseHandler = new RaiseForRemoveAllHandler(this); bool raise = raiseHandler.MustFire; T jtem; foreach (U item in items) { jtem = item; if (remove(ref jtem) && raise) raiseHandler.Remove(jtem); } #if SHRINK if (size < resizethreshhold / 2 && resizethreshhold > 16) { int newlength = table.Length; while (newlength >= 32 && newlength * fillfactor / 2 > size) newlength /= 2; resize(newlength - 1); } #endif if (raise) raiseHandler.Raise(); } /// /// Remove all items from the set, resetting internal table to initial size. /// [Tested] public virtual void Clear() { updatecheck(); int oldsize = size; clear(); if (ActiveEvents != 0 && oldsize > 0) { raiseCollectionCleared(true, oldsize); raiseCollectionChanged(); } } /// /// Remove all items *not* in a supplied collection from this set. /// /// /// The items to retain [Tested] public virtual void RetainAll(SCG.IEnumerable items) where U : T { updatecheck(); HashSet aux = new HashSet(EqualityComparer); //This only works for sets: foreach (U item in items) if (Contains(item)) { T jtem = item; aux.searchoradd(ref jtem, true, false, false); } if (size == aux.size) return; CircularQueue wasRemoved = null; if ((ActiveEvents & EventTypeEnum.Removed) != 0) { wasRemoved = new CircularQueue(); foreach (T item in this) if (!aux.Contains(item)) wasRemoved.Enqueue(item); } table = aux.table; size = aux.size; #if !REFBUCKET defaultvalid = aux.defaultvalid; defaultitem = aux.defaultitem; #endif indexmask = aux.indexmask; resizethreshhold = aux.resizethreshhold; bits = aux.bits; bitsc = aux.bitsc; #if DEBUG #else randomhashfactor = aux.randomhashfactor; #endif if ((ActiveEvents & EventTypeEnum.Removed) != 0) raiseForRemoveAll(wasRemoved); else if ((ActiveEvents & EventTypeEnum.Changed) != 0) raiseCollectionChanged(); } /// /// Check if all items in a supplied collection is in this set /// (ignoring multiplicities). /// /// The items to look for. /// /// True if all items are found. [Tested] public virtual bool ContainsAll(SCG.IEnumerable items) where U : T { foreach (U item in items) if (!Contains(item)) return false; return true; } /// /// Create an array containing all items in this set (in enumeration order). /// /// The array [Tested] public override T[] ToArray() { T[] res = new T[size]; int index = 0; #if !REFBUCKET if (defaultvalid) res[index++] = defaultitem; #endif for (int i = 0; i < table.Length; i++) { Bucket b = table[i]; #if LINEARPROBING #if REFBUCKET if (b != null) res[index++] = b.item; #else if (!isnull(b.item)) res[index++] = b.item; #endif #else #if REFBUCKET while (b != null) { res[index++] = b.item; b = b.overflow; } #else if (!isnull(b.item)) { res[index++] = b.item; OverflowBucket ob = b.overflow; while (ob != null) { res[index++] = ob.item; ob = ob.overflow; } } #endif #endif } Debug.Assert(size == index); return res; } /// /// Count the number of times an item is in this set (either 0 or 1). /// /// The item to look for. /// 1 if item is in set, 0 else [Tested] public virtual int ContainsCount(T item) { return Contains(item) ? 1 : 0; } /// /// /// /// public virtual ICollectionValue UniqueItems() { return this; } /// /// /// /// public virtual ICollectionValue> ItemMultiplicities() { return new MultiplicityOne(this); } /// /// Remove all (at most 1) copies of item from this set. /// /// The item to remove [Tested] public virtual void RemoveAllCopies(T item) { Remove(item); } #endregion #region IEnumerable Members /// /// Choose some item of this collection. /// /// if collection is empty. /// [Tested] public override T Choose() { int len = table.Length; if (size == 0) throw new NoSuchItemException(); #if REFBUCKET do { if (++lastchosen >= len) lastchosen = 0; } while (table[lastchosen] == null); #else if (defaultvalid) return defaultitem; do { if (++lastchosen >= len) lastchosen = 0; } while (isnull(table[lastchosen].item)); #endif return table[lastchosen].item; } /// /// Create an enumerator for this set. /// /// The enumerator [Tested] public override SCG.IEnumerator GetEnumerator() { int index = -1; int mystamp = stamp; int len = table.Length; #if LINEARPROBING #if REFBUCKET while (++index < len) { if (mystamp != stamp) throw new CollectionModifiedException(); if (table[index] != null) yield return table[index].item; } #else if (defaultvalid) yield return defaultitem; while (++index < len) { if (mystamp != stamp) throw new CollectionModifiedException(); T item = table[index].item; if (!isnull(item)) yield return item; } #endif #else #if REFBUCKET Bucket b = null; #else OverflowBucket ob = null; if (defaultvalid) yield return defaultitem; #endif while (true) { if (mystamp != stamp) throw new CollectionModifiedException(); #if REFBUCKET if (b == null || b.overflow == null) { do { if (++index >= len) yield break; } while (table[index] == null); b = table[index]; yield return b.item; } else { b = b.overflow; yield return b.item; } #else if (ob != null && ob.overflow != null) { ob = ob.overflow; yield return ob.item; } else if (index >= 0 && ob == null && (ob = table[index].overflow) != null) { yield return ob.item; } else { do { if (++index >= len) yield break; } while (isnull(table[index].item)); yield return table[index].item; ob = null; } #endif } #endif } #endregion #region ISink Members /// /// Report if this is a set collection. /// /// Always false [Tested] public virtual bool AllowsDuplicates { [Tested]get { return false; } } /// /// By convention this is true for any collection with set semantics. /// /// True if only one representative of a group of equal items /// is kept in the collection together with the total count. public virtual bool DuplicatesByCounting { get { return true; } } /// /// Add an item to this set. /// /// The item to add. /// True if item was added (i.e. not found) [Tested] public virtual bool Add(T item) { updatecheck(); return !searchoradd(ref item, true, false, true); } /// /// Add an item to this set. /// /// The item to add. [Tested] void SCG.ICollection.Add(T item) { Add(item); } /// /// Add the elements from another collection with a more specialized item type /// to this collection. Since this /// collection has set semantics, only items not already in the collection /// will be added. /// /// The type of items to add /// The items to add [Tested] public virtual void AddAll(SCG.IEnumerable items) where U : T { updatecheck(); bool wasChanged = false; bool raiseAdded = (ActiveEvents & EventTypeEnum.Added) != 0; CircularQueue wasAdded = raiseAdded ? new CircularQueue() : null; foreach (T item in items) { T jtem = item; if (!searchoradd(ref jtem, true, false, false)) { wasChanged = true; if (raiseAdded) wasAdded.Enqueue(item); } } //TODO: implement a RaiseForAddAll() method if (raiseAdded & wasChanged) foreach (T item in wasAdded) raiseItemsAdded(item, 1); if (((ActiveEvents & EventTypeEnum.Changed) != 0 && wasChanged)) raiseCollectionChanged(); } #endregion #region Diagnostics /// /// Test internal structure of data (invariants) /// /// True if pass [Tested] public virtual bool Check() { int count = 0; #if LINEARPROBING int lasthole = table.Length - 1; #if REFBUCKET while (lasthole >= 0 && table[lasthole] != null) #else while (lasthole >= 0 && !isnull(table[lasthole].item)) #endif { lasthole--; count++; } if (lasthole < 0) { Console.WriteLine("Table is completely filled!"); return false; } for (int cellindex = lasthole + 1, s = table.Length; cellindex < s; cellindex++) { Bucket b = table[cellindex]; int hashindex = hv2i(b.hashval); if (hashindex <= lasthole || hashindex > cellindex) { Console.WriteLine("Bad cell item={0}, hashval={1}, hashindex={2}, cellindex={3}, lasthole={4}", b.item, b.hashval, hashindex, cellindex, lasthole); return false; } } int latesthole = -1; for (int cellindex = 0; cellindex < lasthole; cellindex++) { Bucket b = table[cellindex]; #if REFBUCKET if (b != null) #else if (!isnull(b.item)) #endif { count++; int hashindex = hv2i(b.hashval); if (cellindex < hashindex && hashindex <= lasthole) { Console.WriteLine("Bad cell item={0}, hashval={1}, hashindex={2}, cellindex={3}, latesthole={4}", b.item, b.hashval, hashindex, cellindex, latesthole); return false; } } else { latesthole = cellindex; break; } } for (int cellindex = latesthole + 1; cellindex < lasthole; cellindex++) { Bucket b = table[cellindex]; #if REFBUCKET if (b != null) #else if (!isnull(b.item)) #endif { count++; int hashindex = hv2i(b.hashval); if (hashindex <= latesthole || cellindex < hashindex) { Console.WriteLine("Bad cell item={0}, hashval={1}, hashindex={2}, cellindex={3}, latesthole={4}", b.item, b.hashval, hashindex, cellindex, latesthole); return false; } } else { latesthole = cellindex; } } return true; #else bool retval = true; if (bitsc != 32 - bits) { Console.WriteLine("bitsc != 32 - bits ({0}, {1})", bitsc, bits); retval = false; } if (indexmask != (1 << bits) - 1) { Console.WriteLine("indexmask != (1 << bits) - 1 ({0}, {1})", indexmask, bits); retval = false; } if (table.Length != indexmask + 1) { Console.WriteLine("table.Length != indexmask + 1 ({0}, {1})", table.Length, indexmask); retval = false; } if (bitsc != 32 - bits) { Console.WriteLine("resizethreshhold != (int)(table.Length * fillfactor) ({0}, {1}, {2})", resizethreshhold, table.Length, fillfactor); retval = false; } for (int i = 0, s = table.Length; i < s; i++) { int level = 0; Bucket b = table[i]; #if REFBUCKET while (b != null) { if (i != hv2i(b.hashval)) { Console.WriteLine("Bad cell item={0}, hashval={1}, index={2}, level={3}", b.item, b.hashval, i, level); retval = false; } count++; level++; b = b.overflow; } #else if (!isnull(b.item)) { count++; if (i != hv2i(b.hashval)) { Console.WriteLine("Bad cell item={0}, hashval={1}, index={2}, level={3}", b.item, b.hashval, i, level); retval = false; } OverflowBucket ob = b.overflow; while (ob != null) { level++; count++; if (i != hv2i(ob.hashval)) { Console.WriteLine("Bad cell item={0}, hashval={1}, index={2}, level={3}", b.item, b.hashval, i, level); retval = false; } ob = ob.overflow; } } #endif } if (count != size) { Console.WriteLine("size({0}) != count({1})", size, count); retval = false; } return retval; #endif } /// /// Produce statistics on distribution of bucket sizes. Current implementation is incomplete. /// /// Histogram data. [Tested(via = "Manually")] public ISortedDictionary BucketCostDistribution() { TreeDictionary res = new TreeDictionary(); #if LINEARPROBING int count = 0; #if REFBUCKET while (table[count] != null) #else while (!isnull(table[count].item)) #endif count++; for (int i = table.Length - 1; i >= 0; i--) { #if REFBUCKET if (table[i] != null) #else if (!isnull(table[i].item)) #endif count++; else count = 0; if (res.Contains(count)) res[count]++; else res[count] = 1; } return res; #else for (int i = 0, s = table.Length; i < s; i++) { int count = 0; #if REFBUCKET Bucket b = table[i]; while (b != null) { count++; b = b.overflow; } #else Bucket b = table[i]; if (!isnull(b.item)) { count = 1; OverflowBucket ob = b.overflow; while (ob != null) { count++; ob = ob.overflow; } } #endif if (res.Contains(count)) res[count]++; else res[count] = 1; } return res; #endif } #endregion #region ICloneable Members /// /// Make a shallow copy of this HashSet. /// /// public virtual object Clone() { HashSet clone = new HashSet(size > 0 ? size : 1, itemequalityComparer); //TODO: make sure this really adds in the counting bag way! clone.AddAll(this); return clone; } #endregion } }