tools/cldr-code/src/main/java/org/unicode/cldr/util/CharUtilities.java - platform/external/cldr - Git at Google

 package org.unicode.cldr.util;

 import java.util.Collection;
 import java.util.Set;
 import java.util.stream.Collectors;

 public class CharUtilities {
     /**
      * Simple wrapper that exposes a {@link CharSequence} through the {@code CharSource}
      * interface. Offsets in the wrapper and in the wrapped sequence are identical, so every
      * offset-mapping method is the identity.
      *
      * @author markdavis
      */
     public static class CharSourceWrapper<T extends CharSequence> implements CharSource {
         /** The wrapped sequence; every method below delegates to it. */
         protected T source;

         /**
          * Wraps the given sequence without copying it.
          *
          * @param source the sequence to expose as a {@code CharSource}
          */
         public CharSourceWrapper(T source) {
             this.source = source;
         }

         /**
          * @param index offset to test
          * @return true if {@code index} is below the length of the wrapped sequence
          */
         @Override
         public boolean hasCharAt(int index) {
             return index < source.length();
         }

         /**
          * @param index offset of the wanted char
          * @return the char of the wrapped sequence at {@code index}
          */
         @Override
         public char charAt(int index) {
             return source.charAt(index);
         }

         /**
          * @param index offset in this wrapper
          * @return the same value, since wrapper and source offsets coincide
          */
         @Override
         public int toSourceOffset(int index) {
             return index;
         }

         /**
          * @param start first offset of the slice (inclusive)
          * @param end last offset of the slice (exclusive)
          * @return a new wrapper around {@code source.subSequence(start, end)}
          */
         @Override
         public CharSource sublist(int start, int end) {
             return new CharSourceWrapper<>(source.subSequence(start, end));
         }

         /**
          * @param start first offset of the slice (inclusive)
          * @return a new wrapper around the wrapped sequence from {@code start} to its end
          */
         @Override
         public CharSource sublist(int start) {
             return new CharSourceWrapper<>(source.subSequence(start, source.length()));
         }

         /**
          * @return the length of the wrapped sequence
          */
         @Override
         public int getKnownLength() {
             return source.length();
         }

         /**
          * @param start first offset (inclusive)
          * @param end last offset (exclusive)
          * @return {@code source.subSequence(start, end)}
          */
         @Override
         public CharSequence subSequence(int start, int end) {
             return source.subSequence(start, end);
         }

         /**
          * @return the string form of the wrapped sequence
          */
         @Override
         public String toString() {
             return source.toString();
         }

         /**
          * Returns a slice of the wrapped sequence, mapping both offsets through {@link
          * #toSourceOffset(int)} first (the identity for this class).
          *
          * @param start first offset (inclusive)
          * @param end last offset (exclusive)
          * @return the matching sub-sequence of the wrapped sequence
          */
         public CharSequence sourceSubSequence(int start, int end) {
             return source.subSequence(toSourceOffset(start), toSourceOffset(end));
         }

         /**
          * @param index offset in the wrapped sequence
          * @return the same value, since wrapper and source offsets coincide
          */
         @Override
         public int fromSourceOffset(int index) {
             return index;
         }

         /**
          * Ignores the requested start; this wrapper is returned unchanged.
          *
          * @param index requested start offset (unused)
          * @return this wrapper
          */
         @Override
         public CharSource setStart(int index) {
             return this;
         }

         /**
          * @return always 0
          */
         @Override
         public int getStart() {
             return 0;
         }
     }

     /**
      * Per-code-unit adjustment, indexed by {@code unit >> 11}, that turns UTF-16 code unit order
      * into code point order once the sum is truncated to 16 bits: units below U+D800 are
      * unchanged, surrogates (U+D800..U+DFFF) move up to 0xF800..0xFFFF, and U+E000..U+FFFF
      * move down to 0xD800..0xF7FF.
      */
     private static final char[] UTF16_FIXUP = {
         0, 0, 0, 0, 0, 0, 0, 0,
         0, 0, 0, 0, 0, 0, 0, 0,
         0, 0, 0, 0, 0, 0, 0, 0,
         0, 0, 0, 0x2000, 0xf800, 0xf800, 0xf800, 0xf800
     };

     /**
      * Maps a UTF-16 code unit to a key whose numeric order matches code point order.
      *
      * @param unit the code unit
      * @return the sort key, in the range 0..0xFFFF
      */
     private static int codePointOrderKey(char unit) {
         // The table relies on 16-bit wrap-around; without the mask, U+E000..U+FFFF would land
         // above the surrogate range instead of below it.
         return (unit + UTF16_FIXUP[unit >> 11]) & 0xFFFF;
     }

     /**
      * Return the code point order of two CharSources. If the text has isolated surrogates, they
      * will not sort correctly.
      *
      * <p>The end of each source is detected with {@code hasCharAt} rather than a length.
      *
      * @param text1 first text
      * @param text2 second text
      * @return 0 if both texts have the same chars; a negative value if {@code text1} sorts
      *     before {@code text2} (including when it is a proper prefix of it); a positive value
      *     otherwise
      */
     public static int compare(CharSource text1, CharSource text2) {
         int i = 0;

         while (true) {
             boolean more1 = text1.hasCharAt(i);
             boolean more2 = text2.hasCharAt(i);
             // handle running out of room: the text that ends first sorts first
             if (!more1) {
                 return more2 ? -1 : 0;
             }
             if (!more2) {
                 return 1;
             }
             char c1 = text1.charAt(i);
             char c2 = text2.charAt(i);
             i++;
             // if they are different, do a fixup
             if (c1 != c2) {
                 return codePointOrderKey(c1) - codePointOrderKey(c2);
             }
         }
     }

     /**
      * Return the code point order of two CharSequences. If the text has isolated surrogates, they
      * will not sort correctly.
      *
      * @param text1 first text
      * @param text2 second text
      * @return 0 if both texts have the same chars; a negative value if {@code text1} sorts
      *     before {@code text2} (including when it is a proper prefix of it); a positive value
      *     otherwise
      */
     public static int compare(CharSequence text1, CharSequence text2) {
         int i = 0;

         while (true) {
             // handle running out of room: the text that ends first sorts first
             if (i >= text1.length()) {
                 return i >= text2.length() ? 0 : -1;
             }
             if (i >= text2.length()) {
                 return 1;
             }
             char c1 = text1.charAt(i);
             char c2 = text2.charAt(i);
             i++;
             // if they are different, do a fixup
             if (c1 != c2) {
                 return codePointOrderKey(c1) - codePointOrderKey(c2);
             }
         }
     }

     /**
      * Intern each element of the collection and return a new unmodifiable Set.
      *
      * @param s the strings to intern
      * @return an unmodifiable set holding the interned strings
      * @throws NullPointerException if {@code s} or one of its elements is null
      */
     public static Set<String> internImmutableSet(Collection<String> s) {
         return s.stream().map(String::intern).collect(Collectors.toUnmodifiableSet());
     }
 }
	package org.unicode.cldr.util;

	import java.util.Collection;
	import java.util.Set;
	import java.util.stream.Collectors;

	public class CharUtilities {
	    /**
	     * Simple wrapper that exposes a {@link CharSequence} through the {@code CharSource}
	     * interface. Offsets in the wrapper and in the wrapped sequence are identical, so every
	     * offset-mapping method is the identity.
	     *
	     * @author markdavis
	     */
	    public static class CharSourceWrapper<T extends CharSequence> implements CharSource {
	        /** The wrapped sequence; every method below delegates to it. */
	        protected T source;

	        /**
	         * Wraps the given sequence without copying it.
	         *
	         * @param source the sequence to expose as a {@code CharSource}
	         */
	        public CharSourceWrapper(T source) {
	            this.source = source;
	        }

	        /**
	         * @param index offset to test
	         * @return true if {@code index} is below the length of the wrapped sequence
	         */
	        @Override
	        public boolean hasCharAt(int index) {
	            return index < source.length();
	        }

	        /**
	         * @param index offset of the wanted char
	         * @return the char of the wrapped sequence at {@code index}
	         */
	        @Override
	        public char charAt(int index) {
	            return source.charAt(index);
	        }

	        /**
	         * @param index offset in this wrapper
	         * @return the same value, since wrapper and source offsets coincide
	         */
	        @Override
	        public int toSourceOffset(int index) {
	            return index;
	        }

	        /**
	         * @param start first offset of the slice (inclusive)
	         * @param end last offset of the slice (exclusive)
	         * @return a new wrapper around {@code source.subSequence(start, end)}
	         */
	        @Override
	        public CharSource sublist(int start, int end) {
	            return new CharSourceWrapper<>(source.subSequence(start, end));
	        }

	        /**
	         * @param start first offset of the slice (inclusive)
	         * @return a new wrapper around the wrapped sequence from {@code start} to its end
	         */
	        @Override
	        public CharSource sublist(int start) {
	            return new CharSourceWrapper<>(source.subSequence(start, source.length()));
	        }

	        /**
	         * @return the length of the wrapped sequence
	         */
	        @Override
	        public int getKnownLength() {
	            return source.length();
	        }

	        /**
	         * @param start first offset (inclusive)
	         * @param end last offset (exclusive)
	         * @return {@code source.subSequence(start, end)}
	         */
	        @Override
	        public CharSequence subSequence(int start, int end) {
	            return source.subSequence(start, end);
	        }

	        /**
	         * @return the string form of the wrapped sequence
	         */
	        @Override
	        public String toString() {
	            return source.toString();
	        }

	        /**
	         * Returns a slice of the wrapped sequence, mapping both offsets through {@link
	         * #toSourceOffset(int)} first (the identity for this class).
	         *
	         * @param start first offset (inclusive)
	         * @param end last offset (exclusive)
	         * @return the matching sub-sequence of the wrapped sequence
	         */
	        public CharSequence sourceSubSequence(int start, int end) {
	            return source.subSequence(toSourceOffset(start), toSourceOffset(end));
	        }

	        /**
	         * @param index offset in the wrapped sequence
	         * @return the same value, since wrapper and source offsets coincide
	         */
	        @Override
	        public int fromSourceOffset(int index) {
	            return index;
	        }

	        /**
	         * Ignores the requested start; this wrapper is returned unchanged.
	         *
	         * @param index requested start offset (unused)
	         * @return this wrapper
	         */
	        @Override
	        public CharSource setStart(int index) {
	            return this;
	        }

	        /**
	         * @return always 0
	         */
	        @Override
	        public int getStart() {
	            return 0;
	        }
	    }

	    /**
	     * Per-code-unit adjustment, indexed by {@code unit >> 11}, that turns UTF-16 code unit order
	     * into code point order once the sum is truncated to 16 bits: units below U+D800 are
	     * unchanged, surrogates (U+D800..U+DFFF) move up to 0xF800..0xFFFF, and U+E000..U+FFFF
	     * move down to 0xD800..0xF7FF.
	     */
	    private static final char[] UTF16_FIXUP = {
	        0, 0, 0, 0, 0, 0, 0, 0,
	        0, 0, 0, 0, 0, 0, 0, 0,
	        0, 0, 0, 0, 0, 0, 0, 0,
	        0, 0, 0, 0x2000, 0xf800, 0xf800, 0xf800, 0xf800
	    };

	    /**
	     * Maps a UTF-16 code unit to a key whose numeric order matches code point order.
	     *
	     * @param unit the code unit
	     * @return the sort key, in the range 0..0xFFFF
	     */
	    private static int codePointOrderKey(char unit) {
	        // The table relies on 16-bit wrap-around; without the mask, U+E000..U+FFFF would land
	        // above the surrogate range instead of below it.
	        return (unit + UTF16_FIXUP[unit >> 11]) & 0xFFFF;
	    }

	    /**
	     * Return the code point order of two CharSources. If the text has isolated surrogates, they
	     * will not sort correctly.
	     *
	     * <p>The end of each source is detected with {@code hasCharAt} rather than a length.
	     *
	     * @param text1 first text
	     * @param text2 second text
	     * @return 0 if both texts have the same chars; a negative value if {@code text1} sorts
	     *     before {@code text2} (including when it is a proper prefix of it); a positive value
	     *     otherwise
	     */
	    public static int compare(CharSource text1, CharSource text2) {
	        int i = 0;

	        while (true) {
	            boolean more1 = text1.hasCharAt(i);
	            boolean more2 = text2.hasCharAt(i);
	            // handle running out of room: the text that ends first sorts first
	            if (!more1) {
	                return more2 ? -1 : 0;
	            }
	            if (!more2) {
	                return 1;
	            }
	            char c1 = text1.charAt(i);
	            char c2 = text2.charAt(i);
	            i++;
	            // if they are different, do a fixup
	            if (c1 != c2) {
	                return codePointOrderKey(c1) - codePointOrderKey(c2);
	            }
	        }
	    }

	    /**
	     * Return the code point order of two CharSequences. If the text has isolated surrogates, they
	     * will not sort correctly.
	     *
	     * @param text1 first text
	     * @param text2 second text
	     * @return 0 if both texts have the same chars; a negative value if {@code text1} sorts
	     *     before {@code text2} (including when it is a proper prefix of it); a positive value
	     *     otherwise
	     */
	    public static int compare(CharSequence text1, CharSequence text2) {
	        int i = 0;

	        while (true) {
	            // handle running out of room: the text that ends first sorts first
	            if (i >= text1.length()) {
	                return i >= text2.length() ? 0 : -1;
	            }
	            if (i >= text2.length()) {
	                return 1;
	            }
	            char c1 = text1.charAt(i);
	            char c2 = text2.charAt(i);
	            i++;
	            // if they are different, do a fixup
	            if (c1 != c2) {
	                return codePointOrderKey(c1) - codePointOrderKey(c2);
	            }
	        }
	    }

	    /**
	     * Intern each element of the collection and return a new unmodifiable Set.
	     *
	     * @param s the strings to intern
	     * @return an unmodifiable set holding the interned strings
	     * @throws NullPointerException if {@code s} or one of its elements is null
	     */
	    public static Set<String> internImmutableSet(Collection<String> s) {
	        return s.stream().map(String::intern).collect(Collectors.toUnmodifiableSet());
	    }
	}