Subversion Repositories splitter

Rev

Rev 32 | Blame | Compare with Previous | Last modification | View Log | RSS feed

/*
 * Copyright (C) 2008 Steve Ratcliffe
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License version 3
 *  as published by the Free Software Foundation.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *
 * Author: Steve Ratcliffe
 * Create date: 19-Dec-2008
 */

package uk.me.parabola.splitter;

import java.util.Iterator;


/**
 * An int/int map that is split into several smaller maps.  This is to avoid the problem where
 * rehashing a map temporarily consumes twice as much memory as is actually required.
 * We only ever have to rehash one of the sub maps at a time and therefore much less
 * temporary space is required.
 *
 * It is all a balance though, there is an overhead in each map because of the load factor.
 * Also it is going to be slower overall.  So splitting into 4 seems about right.
 *
 * @author Steve Ratcliffe
 */

public class SplitIntMap {
        private static final int NMAPS = 4;
        private static final int MASK = NMAPS-1;

        private static final int INIT_CAP = 1<<16;
        private static final float LOAD = 0.7f;

        private int size;

        private final IntIntMap[] maps = new IntIntMap[NMAPS];

        public SplitIntMap() {
                for (int i = 0; i < NMAPS; i++) {
                        maps[i] = new IntIntMap(INIT_CAP, LOAD);
                        //maps[i].growthFactor(4);
                }
        }


        public void put(int key, int value) {
                maps[key & MASK].put(key, value);
        }

        public int get(int key) {
                return maps[key & MASK].get(key);
        }

        public int size() {
                if (this.size != 0)
                        return size;

                int size = 0;
                for (int i = 0; i < NMAPS; i++) {
                        size += maps[i].size();
                }
                return size;
        }

        /**
         * An iterate over the entry set of the map.  The same Entry object is returned
         * each time.
         * @return An iterator that uses the same object each time it returns, with different
         * values filled in.
         */

        public Iterator<IntIntMap.Entry> fastIterator() {
                return new NormalObjectIterator();
        }

        /**
         * The deleting iterator takes case of the case where you are transfering the entries from
         * one map to another.  Once they are read, they are no longer needed and so the map
         * can be freed.  This avoids avoids using double the memory when splitting the areas.
         * @return An iterator over the entry set.  The same Entry is returned each time.
         */

        public Iterator<IntIntMap.Entry> fastDeletingIterator() {
                return new NormalObjectIterator(true);
        }

        /**
         * Trim the map down to its minimum size.  This can be used when we are not going to
         * add to the map any more to reduce the overhead of having several sub-maps.
         */

        public void trim() {
                for (int i = 0; i < NMAPS; i++) {
                        //maps[i].trim();
                }
        }

        /**
         * Iterates over all the sub-maps.
         */

        private class NormalObjectIterator implements Iterator<IntIntMap.Entry> {

                private final boolean deleteAfter;

                private final Iterator[] iterators = new Iterator[NMAPS];

                private int currentMap;

                private NormalObjectIterator(boolean deleteAfter) {
                        if (deleteAfter)
                                fixSize();
                       
                        this.deleteAfter = deleteAfter;
                        for (int i = 0; i < NMAPS; i++) {
                                iterators[i] = maps[i].entryIterator();
                        }
                }

                private NormalObjectIterator() {
                        this(false);
                }

                /**
                 * Note that you have to call this for the call to next() to be correct
                 * and so it doesn't properly follow the contract for hasNext() on the
                 * regular Iterator.
                 */

                public boolean hasNext() {
                        // All done
                        if (currentMap >= NMAPS)
                                return false;

                        // easy case:
                        if (iterators[currentMap].hasNext())
                                return true;

                        // Else step to the next one and try it
                        if (deleteAfter) {
                                iterators[currentMap] = null;
                                maps[currentMap] = null;
                        }
                        currentMap++;
                        return hasNext();
                }

                public IntIntMap.Entry next() {
                        return (IntIntMap.Entry) iterators[currentMap].next();
                }

                public void remove() {
                        throw new UnsupportedOperationException();
                }

                private void fixSize() {
                        size = size();
                }
        }
}