blob: fd3c9c4dc25537b5d96071d0ceaa83552d09773d [file] [log] [blame]
/*
* Copyright (C) 2010 The Guava Authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.google.common.base;
import com.google.caliper.BeforeExperiment;
import com.google.caliper.Benchmark;
import com.google.caliper.Param;
import java.util.BitSet;
import java.util.Random;
/** Benchmark for the {@link CharMatcher#whitespace} implementation. */
public class WhitespaceMatcherBenchmark {
private static final int STRING_LENGTH = 10000;
private static final String OLD_WHITESPACE_TABLE =
"\u0001\u0000\u00a0\u0000\u0000\u0000\u0000\u0000"
+ "\u0000\u0009\n\u000b\u000c\r\u0000\u0000\u2028\u2029\u0000\u0000\u0000\u0000\u0000"
+ "\u202f\u0000\u0000\u0000\u0000\u0000\u0000\u0000\u0000\u0020\u0000\u0000\u0000\u0000"
+ "\u0000\u0000\u0000\u0000\u0000\u0000\u3000\u0000\u0000\u0000\u0000\u0000\u0000\u0000"
+ "\u0000\u0000\u0000\u0085\u2000\u2001\u2002\u2003\u2004\u2005\u2006\u2007\u2008\u2009"
+ "\u200a\u0000\u0000\u0000\u0000\u0000\u205f\u1680\u0000\u0000\u180e\u0000\u0000\u0000";
public static final CharMatcher OLD_WHITESPACE =
new CharMatcher() {
@Override
public boolean matches(char c) {
return OLD_WHITESPACE_TABLE.charAt(c % 79) == c;
}
};
@Param private boolean useNew;
@Param({"20", "50", "80"})
private int percentMatching;
private String teststring;
private CharMatcher matcher;
@BeforeExperiment
protected void setUp() {
BitSet bitSet = new BitSet();
for (int i = 0; i < OLD_WHITESPACE_TABLE.length(); i++) {
bitSet.set(OLD_WHITESPACE_TABLE.charAt(i));
}
bitSet.clear(0);
bitSet.clear(1);
matcher = useNew ? CharMatcher.whitespace() : OLD_WHITESPACE;
teststring = newTestString(new Random(1), bitSet, percentMatching);
}
@Benchmark
public int countIn(int reps) {
int result = 0;
CharMatcher matcher = this.matcher;
String teststring = this.teststring;
for (int i = 0; i < reps; i++) {
result += matcher.countIn(teststring);
}
return result;
}
@Benchmark
public int collapseFrom(int reps) {
int result = 0;
CharMatcher matcher = this.matcher;
String teststring = this.teststring;
for (int i = 0; i < reps; i++) {
result += System.identityHashCode(matcher.collapseFrom(teststring, ' '));
}
return result;
}
private static String allMatchingChars(BitSet bitSet) {
final char[] result = new char[bitSet.cardinality()];
for (int j = 0, c = bitSet.nextSetBit(0); j < result.length; ++j) {
result[j] = (char) c;
c = bitSet.nextSetBit(c + 1);
}
return new String(result);
}
private static String newTestString(Random random, BitSet bitSet, int percentMatching) {
final String allMatchingChars = allMatchingChars(bitSet);
final char[] result = new char[STRING_LENGTH];
// Fill with matching chars.
for (int i = 0; i < result.length; i++) {
result[i] = allMatchingChars.charAt(random.nextInt(allMatchingChars.length()));
}
// Replace some of chars by non-matching.
int remaining = (int) ((100 - percentMatching) * result.length / 100.0 + 0.5);
while (remaining > 0) {
final char c = (char) random.nextInt();
if (bitSet.get(c)) {
final int pos = random.nextInt(result.length);
if (bitSet.get(result[pos])) {
result[pos] = c;
remaining--;
}
}
}
return new String(result);
}
}