luni/src/main/java/org/apache/harmony/security/provider/cert/Cache.java - platform/libcore-snapshot - Git at Google

 /*
  *  Licensed to the Apache Software Foundation (ASF) under one or more
  *  contributor license agreements.  See the NOTICE file distributed with
  *  this work for additional information regarding copyright ownership.
  *  The ASF licenses this file to You under the Apache License, Version 2.0
  *  (the "License"); you may not use this file except in compliance with
  *  the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  *  Unless required by applicable law or agreed to in writing, software
  *  distributed under the License is distributed on an "AS IS" BASIS,
  *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  *  See the License for the specific language governing permissions and
  *  limitations under the License.
  */

 /**
 * @author Alexander Y. Kleymenov
 * @version $Revision$
 */

 package org.apache.harmony.security.provider.cert;

 import java.util.Arrays;

 /**
  * The caching mechanism designed to speed up the process
  * of Certificates/CRLs generation in the case of their repeated
  * generation.
  *
  * It keeps correspondences between Objects (Certificates or CLRs)
  * and arrays of bytes on the base of which the Objects have been generated,
  * and provides the means to determine whether it contains the object built on
  * the base of particular encoded form or not. If there are such
  * objects they are returned from the cache, if not - newly generated
  * objects can be saved in the cache.<br>
  *
  * The process of Certificate/CRL generation
  * (implemented in <code>X509CertFactoryImpl</code>) is accompanied with
  * prereading of the beginning of encoded form. This prefix is used to determine
  * whether provided form is PEM encoding or not.<br>
  *
  * So the use of the prefix is the first point to (approximately)
  * determine whether object to be generated is in the cache or not.
  *
  * The failure of the predetermination process tells us that there were not
  * object generated from the encoded form with such prefix and we should
  * generate (decode) the object. If predetermination is successful,
  * we conduct the accurate search on the base of whole encoded form. <br>
  *
  * So to speed up the object generation process this caching mechanism provides
  * the following functionality:<br>
  *
  *      1. With having of the beginning of the encoded form (prefix)
  * it is possible to predetermine whether object has already been
  * generated on the base of the encoding with the SIMILAR prefix or not.
  * This process is not computationally expensive and takes a little time.
  * But it prevents us from use of expensive full encoding
  * search in the case of its failure.<br>
  *
  *      2. If predetermination ends with success, the whole encoding
  * form should be provided to make the final answer: whether object has
  * already been generated on the base of this PARTICULAR encoded form or not.
  * If it is so - the cached object is returned from the cache,
  * if not - new object should be generated and saved in the cache.<br>
  *
  * Note: The length of the prefixes of the encoded forms should not be
  * less than correspondence (default value is 28).
  */
 public class Cache {

     // Hash code consist of 6 bytes: AABB00
     // where:
     // AA - 2 bytes for prefix hash
     //      value generated on the base of the prefix of encoding
     // BB - 2 bytes for tail hash
     //      value generated on the base of the tail of encoding
     // 00 - 2 reserved bytes equals to 0
     //
     // Note, that it is possible for 2 different arrays to have
     // the similar hash codes.

     // The masks to work with hash codes:
     // the hash code without the reserved bytes
     private static final long HASH_MASK = 0xFFFFFFFFFFFF0000L;
     // the hash code of the prefix
     private static final long PREFIX_HASH_MASK = 0xFFFFFFFF00000000L;
     // the index value contained in reserved bytes
     private static final int  INDEX_MASK = 0x00FFFF;

     // size of the cache
     private final int cache_size;
     // the number of bytes which will be used for array hash generation.
     private final int prefix_size;

     // The following 3 arrays contain the information about cached objects.
     // This information includes: hash of the array, encoded form of the object,
     // and the object itself.
     // The hash-encoding-object correspondence is made by means of index
     // in the particular array. I.e. for index N hash contained in hashes[N]
     // corresponds to the encoding contained in encodings[N] which corresponds
     // to the object cached at cache[N]

     // array containing the hash codes of encodings
     private final long[] hashes;
     // array containing the encodings of the cached objects
     private final byte[][] encodings;
     // array containing the cached objects
     private final Object[] cache;

     // This array is used to speed up the process of the search in the cache.
     // This is an ordered array of the hash codes from 'hashes' array (described
     // above) with last 2 (reserved) bytes equals to the index of
     // the hash in the 'hashes' array. I.e. hash code ABCD00 with index 10 in
     // the hashes array will be represented in this array as ABCD0A (10==0x0A)
     // So this array contains ordered <hash to index> correspondences.
     // Note, that every item in this array is unique.
     private final long[] hashes_idx;

     // the index of the last cached object
     private int last_cached = 0;
     // cache population indicator
     private boolean cache_is_full = false;

     /**
      * Creates the Cache object.
      * @param pref_size specifies how many leading/trailing bytes of object's
      * encoded form will be used for hash computation
      * @param size capacity of the cache to be created.
      */
     public Cache(int pref_size, int size) {
         cache_size = size;
         prefix_size = pref_size;
         hashes = new long[cache_size];
         hashes_idx = new long[cache_size];
         encodings = new byte[cache_size][];
         cache = new Object[cache_size];
     }

     /**
      * Creates the Cache object of size of 9.
      * @param pref_size specifies how many leading/trailing bytes of object's
      * encoded form will be used for hash computation
      */
     public Cache(int pref_size) {
         this(pref_size, 9);
     }

     /**
      * Creates the Cache object of size of 9.
      */
     public Cache() {
         this(28, 9);
     }

     /**
      * Returns the hash code for the array. This code is used to
      * predetermine whether the object was built on the base of the
      * similar encoding or not (by means of <code>contains(long)</code> method),
      * to exactly determine whether object is contained in the cache or not,
      * and to put the object in the cache.
      * Note: parameter array should be of length not less than
      * specified by <code>prefix_size</code> (default 28)
      * @param arr the byte array containing at least prefix_size leading bytes
      * of the encoding.
      * @return hash code for specified encoding prefix
      */
     public long getHash(byte[] arr) {
         long hash = 0;
         for (int i=1; i<prefix_size; i++) {
             hash += (arr[i] & 0xFF);
         } // it takes about 2 bytes for prefix_size == 28

         // shift to the correct place
         hash = hash << 32;
         return hash;
     }

     /**
      * Checks if there are any object in the cache generated
      * on the base of encoding with prefix corresponding
      * to the specified hash code.
      * @param prefix_hash the hash code for the prefix
      * of the encoding (retrieved by method <code>getHash(byte[]))</code>
      * @return false if there were not any object generated
      * on the base of encoding with specified hash code, true
      * otherwise.
      */
     public boolean contains(long prefix_hash) {
         if (prefix_hash == 0) {
             return false;
         }
         int idx = -1*Arrays.binarySearch(hashes_idx, prefix_hash)-1;
         if (idx == cache_size) {
             return false;
         } else {
             return (hashes_idx[idx] & PREFIX_HASH_MASK) == prefix_hash;
         }
     }

     /**
      * Returns the object built on the base on the specified encoded
      * form if it is contained in the cache and null otherwise.
      * This method is computationally expensive and should be called only if
      * the method <code>contains(long)</code> for the hash code returned true.
      * @param hash the hash code for the prefix of the encoding
      * (retrieved by method <code>getHash(byte[])</code>)
      * @param encoding encoded form of the required object.
      * @return the object corresponding to specified encoding or null if
      * there is no such correspondence.
      */
     public Object get(long hash, byte[] encoding) {
         hash |= getSuffHash(encoding);
         if (hash == 0) {
             return null;
         }
         int idx = -1*Arrays.binarySearch(hashes_idx, hash)-1;
         if (idx == cache_size) {
             return null;
         }
         while ((hashes_idx[idx] & HASH_MASK) == hash) {
             int i = (int) (hashes_idx[idx] & INDEX_MASK) - 1;
             if (Arrays.equals(encoding, encodings[i])) {
                 return cache[i];
             }
             idx++;
             if (idx == cache_size) {
                 return null;
             }
         }
         return null;
     }

     /**
      * Puts the object into the cache.
      * @param hash hash code for the prefix of the encoding
      * @param encoding the encoded form of the object
      * @param object the object to be saved in the cache
      */
     public void put(long hash, byte[] encoding, Object object) {
         // check for empty space in the cache
         if (last_cached == cache_size) {
             // so cache is full, will erase the first entry in the
             // cache (oldest entry). it could be better to throw out
             // rarely used value instead of oldest one..
             last_cached = 0;
             cache_is_full = true;
         }
         // index pointing to the item of the table to be overwritten
         int index = last_cached++;

         // improve the hash value with info from the tail of encoding
         hash |= getSuffHash(encoding);

         if (cache_is_full) {
             // indexing hash value to be overwritten:
             long idx_hash = (hashes[index] | (index+1));
             int idx = Arrays.binarySearch(hashes_idx, idx_hash);
             if (idx < 0) {
                 // it will never happen because we use saved hash value
                 // (hashes[index])
                 System.out.println("WARNING! "+idx);
                 idx = -(idx + 1);
             }
             long new_hash_idx = (hash | (index + 1));
             int new_idx = Arrays.binarySearch(hashes_idx, new_hash_idx);
             if (new_idx >= 0) {
                 // it's possible when we write the same hash in the same cell
                 if (idx != new_idx) {
                     // it will never happen because we use the same
                     // hash and the same index in hash table
                     System.out.println("WARNING: ");
                     System.out.println(">> idx: "+idx+" new_idx: "+new_idx);
                 }
             } else {
                 new_idx = -(new_idx + 1);
                 // replace in sorted array
                 if (new_idx > idx) {
                     System.arraycopy(hashes_idx, idx+1, hashes_idx, idx,
                             new_idx - idx - 1);
                     hashes_idx[new_idx-1] = new_hash_idx;
                 } else if (idx > new_idx) {
                     System.arraycopy(hashes_idx, new_idx, hashes_idx, new_idx+1,
                             idx - new_idx);
                     hashes_idx[new_idx] = new_hash_idx;
                 } else { // idx == new_idx
                     hashes_idx[new_idx] = new_hash_idx;
                 }
             }
         } else {
             long idx_hash = (hash | (index + 1));
             int idx = Arrays.binarySearch(hashes_idx, idx_hash);
             if (idx < 0) {
                 // it will always be true because idx_hash depends on index
                 idx = -(idx + 1);
             }
             idx = idx - 1;
             if (idx != cache_size - index - 1) {
                 // if not in the cell containing 0 (free cell), do copy:
                 System.arraycopy(hashes_idx, cache_size - index,
                         hashes_idx, cache_size - index - 1,
                         idx - (cache_size - index) + 1);
             }
             hashes_idx[idx] = idx_hash;
         }
         // overwrite the values in the tables:
         hashes[index] = hash;
         encodings[index] = encoding;
         cache[index] = object;
     }

     // Returns the hash code built on the base of the tail of the encoded form
     // @param arr - the array containing at least prefix_size trailing bytes
     // of encoded form
     private long getSuffHash(byte[] arr) {
         long hash_addon = 0;
         for (int i=arr.length-1; i>arr.length - prefix_size; i--) {
             hash_addon += (arr[i] & 0xFF);
         }
         return hash_addon << 16;
     }

 }
	/*
	* Licensed to the Apache Software Foundation (ASF) under one or more
	* contributor license agreements. See the NOTICE file distributed with
	* this work for additional information regarding copyright ownership.
	* The ASF licenses this file to You under the Apache License, Version 2.0
	* (the "License"); you may not use this file except in compliance with
	* the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	/**
	* @author Alexander Y. Kleymenov
	* @version $Revision$
	*/

	package org.apache.harmony.security.provider.cert;

	import java.util.Arrays;

	/**
	* The caching mechanism designed to speed up the process
	* of Certificates/CRLs generation in the case of their repeated
	* generation.
	*
	* It keeps correspondences between Objects (Certificates or CLRs)
	* and arrays of bytes on the base of which the Objects have been generated,
	* and provides the means to determine whether it contains the object built on
	* the base of particular encoded form or not. If there are such
	* objects they are returned from the cache, if not - newly generated
	* objects can be saved in the cache.<br>
	*
	* The process of Certificate/CRL generation
	* (implemented in <code>X509CertFactoryImpl</code>) is accompanied with
	* prereading of the beginning of encoded form. This prefix is used to determine
	* whether provided form is PEM encoding or not.<br>
	*
	* So the use of the prefix is the first point to (approximately)
	* determine whether object to be generated is in the cache or not.
	*
	* The failure of the predetermination process tells us that there were not
	* object generated from the encoded form with such prefix and we should
	* generate (decode) the object. If predetermination is successful,
	* we conduct the accurate search on the base of whole encoded form. <br>
	*
	* So to speed up the object generation process this caching mechanism provides
	* the following functionality:<br>
	*
	* 1. With having of the beginning of the encoded form (prefix)
	* it is possible to predetermine whether object has already been
	* generated on the base of the encoding with the SIMILAR prefix or not.
	* This process is not computationally expensive and takes a little time.
	* But it prevents us from use of expensive full encoding
	* search in the case of its failure.<br>
	*
	* 2. If predetermination ends with success, the whole encoding
	* form should be provided to make the final answer: whether object has
	* already been generated on the base of this PARTICULAR encoded form or not.
	* If it is so - the cached object is returned from the cache,
	* if not - new object should be generated and saved in the cache.<br>
	*
	* Note: The length of the prefixes of the encoded forms should not be
	* less than correspondence (default value is 28).
	*/
	public class Cache {

	// Hash code consist of 6 bytes: AABB00
	// where:
	// AA - 2 bytes for prefix hash
	// value generated on the base of the prefix of encoding
	// BB - 2 bytes for tail hash
	// value generated on the base of the tail of encoding
	// 00 - 2 reserved bytes equals to 0
	//
	// Note, that it is possible for 2 different arrays to have
	// the similar hash codes.

	// The masks to work with hash codes:
	// the hash code without the reserved bytes
	private static final long HASH_MASK = 0xFFFFFFFFFFFF0000L;
	// the hash code of the prefix
	private static final long PREFIX_HASH_MASK = 0xFFFFFFFF00000000L;
	// the index value contained in reserved bytes
	private static final int INDEX_MASK = 0x00FFFF;

	// size of the cache
	private final int cache_size;
	// the number of bytes which will be used for array hash generation.
	private final int prefix_size;

	// The following 3 arrays contain the information about cached objects.
	// This information includes: hash of the array, encoded form of the object,
	// and the object itself.
	// The hash-encoding-object correspondence is made by means of index
	// in the particular array. I.e. for index N hash contained in hashes[N]
	// corresponds to the encoding contained in encodings[N] which corresponds
	// to the object cached at cache[N]

	// array containing the hash codes of encodings
	private final long[] hashes;
	// array containing the encodings of the cached objects
	private final byte[][] encodings;
	// array containing the cached objects
	private final Object[] cache;

	// This array is used to speed up the process of the search in the cache.
	// This is an ordered array of the hash codes from 'hashes' array (described
	// above) with last 2 (reserved) bytes equals to the index of
	// the hash in the 'hashes' array. I.e. hash code ABCD00 with index 10 in
	// the hashes array will be represented in this array as ABCD0A (10==0x0A)
	// So this array contains ordered <hash to index> correspondences.
	// Note, that every item in this array is unique.
	private final long[] hashes_idx;

	// the index of the last cached object
	private int last_cached = 0;
	// cache population indicator
	private boolean cache_is_full = false;

	/**
	* Creates the Cache object.
	* @param pref_size specifies how many leading/trailing bytes of object's
	* encoded form will be used for hash computation
	* @param size capacity of the cache to be created.
	*/
	public Cache(int pref_size, int size) {
	cache_size = size;
	prefix_size = pref_size;
	hashes = new long[cache_size];
	hashes_idx = new long[cache_size];
	encodings = new byte[cache_size][];
	cache = new Object[cache_size];
	}

	/**
	* Creates the Cache object of size of 9.
	* @param pref_size specifies how many leading/trailing bytes of object's
	* encoded form will be used for hash computation
	*/
	public Cache(int pref_size) {
	this(pref_size, 9);
	}

	/**
	* Creates the Cache object of size of 9.
	*/
	public Cache() {
	this(28, 9);
	}

	/**
	* Returns the hash code for the array. This code is used to
	* predetermine whether the object was built on the base of the
	* similar encoding or not (by means of <code>contains(long)</code> method),
	* to exactly determine whether object is contained in the cache or not,
	* and to put the object in the cache.
	* Note: parameter array should be of length not less than
	* specified by <code>prefix_size</code> (default 28)
	* @param arr the byte array containing at least prefix_size leading bytes
	* of the encoding.
	* @return hash code for specified encoding prefix
	*/
	public long getHash(byte[] arr) {
	long hash = 0;
	for (int i=1; i<prefix_size; i++) {
	hash += (arr[i] & 0xFF);
	} // it takes about 2 bytes for prefix_size == 28

	// shift to the correct place
	hash = hash << 32;
	return hash;
	}

	/**
	* Checks if there are any object in the cache generated
	* on the base of encoding with prefix corresponding
	* to the specified hash code.
	* @param prefix_hash the hash code for the prefix
	* of the encoding (retrieved by method <code>getHash(byte[]))</code>
	* @return false if there were not any object generated
	* on the base of encoding with specified hash code, true
	* otherwise.
	*/
	public boolean contains(long prefix_hash) {
	if (prefix_hash == 0) {
	return false;
	}
	int idx = -1*Arrays.binarySearch(hashes_idx, prefix_hash)-1;
	if (idx == cache_size) {
	return false;
	} else {
	return (hashes_idx[idx] & PREFIX_HASH_MASK) == prefix_hash;
	}
	}

	/**
	* Returns the object built on the base on the specified encoded
	* form if it is contained in the cache and null otherwise.
	* This method is computationally expensive and should be called only if
	* the method <code>contains(long)</code> for the hash code returned true.
	* @param hash the hash code for the prefix of the encoding
	* (retrieved by method <code>getHash(byte[])</code>)
	* @param encoding encoded form of the required object.
	* @return the object corresponding to specified encoding or null if
	* there is no such correspondence.
	*/
	public Object get(long hash, byte[] encoding) {
	hash \|= getSuffHash(encoding);
	if (hash == 0) {
	return null;
	}
	int idx = -1*Arrays.binarySearch(hashes_idx, hash)-1;
	if (idx == cache_size) {
	return null;
	}
	while ((hashes_idx[idx] & HASH_MASK) == hash) {
	int i = (int) (hashes_idx[idx] & INDEX_MASK) - 1;
	if (Arrays.equals(encoding, encodings[i])) {
	return cache[i];
	}
	idx++;
	if (idx == cache_size) {
	return null;
	}
	}
	return null;
	}

	/**
	* Puts the object into the cache.
	* @param hash hash code for the prefix of the encoding
	* @param encoding the encoded form of the object
	* @param object the object to be saved in the cache
	*/
	public void put(long hash, byte[] encoding, Object object) {
	// check for empty space in the cache
	if (last_cached == cache_size) {
	// so cache is full, will erase the first entry in the
	// cache (oldest entry). it could be better to throw out
	// rarely used value instead of oldest one..
	last_cached = 0;
	cache_is_full = true;
	}
	// index pointing to the item of the table to be overwritten
	int index = last_cached++;

	// improve the hash value with info from the tail of encoding
	hash \|= getSuffHash(encoding);

	if (cache_is_full) {
	// indexing hash value to be overwritten:
	long idx_hash = (hashes[index] \| (index+1));
	int idx = Arrays.binarySearch(hashes_idx, idx_hash);
	if (idx < 0) {
	// it will never happen because we use saved hash value
	// (hashes[index])
	System.out.println("WARNING! "+idx);
	idx = -(idx + 1);
	}
	long new_hash_idx = (hash \| (index + 1));
	int new_idx = Arrays.binarySearch(hashes_idx, new_hash_idx);
	if (new_idx >= 0) {
	// it's possible when we write the same hash in the same cell
	if (idx != new_idx) {
	// it will never happen because we use the same
	// hash and the same index in hash table
	System.out.println("WARNING: ");
	System.out.println(">> idx: "+idx+" new_idx: "+new_idx);
	}
	} else {
	new_idx = -(new_idx + 1);
	// replace in sorted array
	if (new_idx > idx) {
	System.arraycopy(hashes_idx, idx+1, hashes_idx, idx,
	new_idx - idx - 1);
	hashes_idx[new_idx-1] = new_hash_idx;
	} else if (idx > new_idx) {
	System.arraycopy(hashes_idx, new_idx, hashes_idx, new_idx+1,
	idx - new_idx);
	hashes_idx[new_idx] = new_hash_idx;
	} else { // idx == new_idx
	hashes_idx[new_idx] = new_hash_idx;
	}
	}
	} else {
	long idx_hash = (hash \| (index + 1));
	int idx = Arrays.binarySearch(hashes_idx, idx_hash);
	if (idx < 0) {
	// it will always be true because idx_hash depends on index
	idx = -(idx + 1);
	}
	idx = idx - 1;
	if (idx != cache_size - index - 1) {
	// if not in the cell containing 0 (free cell), do copy:
	System.arraycopy(hashes_idx, cache_size - index,
	hashes_idx, cache_size - index - 1,
	idx - (cache_size - index) + 1);
	}
	hashes_idx[idx] = idx_hash;
	}
	// overwrite the values in the tables:
	hashes[index] = hash;
	encodings[index] = encoding;
	cache[index] = object;
	}

	// Returns the hash code built on the base of the tail of the encoded form
	// @param arr - the array containing at least prefix_size trailing bytes
	// of encoded form
	private long getSuffHash(byte[] arr) {
	long hash_addon = 0;
	for (int i=arr.length-1; i>arr.length - prefix_size; i--) {
	hash_addon += (arr[i] & 0xFF);
	}
	return hash_addon << 16;
	}

	}