Java Examples & Tutorials of Character.getType (java.lang)

 /**
  * Tests whether the given character belongs to the Unicode general
  * category of control characters.
  *
  * @param c the character to test
  * @return {@code true} if the general category of {@code c} is
  *         {@link Character#CONTROL}; {@code false} otherwise
  */
 public static boolean isControl(char c) {
  final int category = Character.getType(c);
  return category == Character.CONTROL;
 }
}

/**
 * Tests whether the given character falls into one of the Unicode symbol
 * categories: math, currency, modifier or other symbol.
 *
 * @param c the character to test
 * @return {@code true} if {@code c} is a symbol; {@code false} otherwise
 */
public static boolean isSymbol(char c) {
 switch (Character.getType(c)) {
  case Character.MATH_SYMBOL:
  case Character.CURRENCY_SYMBOL:
  case Character.MODIFIER_SYMBOL:
  case Character.OTHER_SYMBOL:
   return true;
  default:
   return false;
 }
}

/**
 * Tests whether the given character falls into one of the Unicode
 * punctuation categories: start, end, other, connector, dash, initial
 * quote or final quote punctuation.
 *
 * @param c the character to test
 * @return {@code true} if {@code c} is punctuation; {@code false} otherwise
 */
public static boolean isPunctuation(char c) {
 switch (Character.getType(c)) {
  case Character.START_PUNCTUATION:
  case Character.END_PUNCTUATION:
  case Character.OTHER_PUNCTUATION:
  case Character.CONNECTOR_PUNCTUATION:
  case Character.DASH_PUNCTUATION:
  case Character.INITIAL_QUOTE_PUNCTUATION:
  case Character.FINAL_QUOTE_PUNCTUATION:
   return true;
  default:
   return false;
 }
}

/**
 * Returns the general Unicode category of a single {@code char} by
 * delegating to the {@code int} (code point) overload of {@code getType}.
 *
 * @param c
 *            the character whose category is requested.
 * @return the Unicode category of {@code c}.
 */
public static int getType(char c) {
  // Widen explicitly so the code point overload is selected rather than this method.
  final int codePoint = c;
  return getType(codePoint);
}

/**
 * Tests whether a character is considered printable, i.e. its Unicode
 * general category is none of: unassigned, line separator, paragraph
 * separator, control, format, private use or surrogate.
 *
 * @param c the character to test
 * @return {@code false} if {@code c} is in one of the excluded categories;
 *         {@code true} otherwise
 */
public static boolean isPrintableUnicode(char c) {
 switch (Character.getType(c)) {
  case Character.UNASSIGNED:
  case Character.LINE_SEPARATOR:
  case Character.PARAGRAPH_SEPARATOR:
  case Character.CONTROL:
  case Character.FORMAT:
  case Character.PRIVATE_USE:
  case Character.SURROGATE:
   return false;
  default:
   return true;
 }
}

  /**
   * Tests whether the given code point is matched by this category class.
   *
   * <p>The code point is handed to {@link Character#getType(int)} unchanged.
   * Narrowing it to {@code char} first would drop the high bits, so a
   * supplementary code point (above U+FFFF) would be classified by an
   * unrelated BMP character.
   *
   * @param ch the code point to test
   * @return whether the general category of {@code ch} equals {@code category},
   *         inverted when {@code alt} is set
   */
  @Override
  public boolean contains(int ch) {
    return alt ^ (category == Character.getType(ch));
  }
}

  /**
   * Tests whether the given code point is matched by this category class.
   *
   * <p>{@code category} is read as a bit mask: the bit at the position given
   * by the code point's general category value decides the match.
   *
   * <p>The code point is handed to {@link Character#getType(int)} unchanged.
   * Narrowing it to {@code char} first would drop the high bits, so a
   * supplementary code point (above U+FFFF) would be classified by an
   * unrelated BMP character.
   *
   * @param ch the code point to test
   * @return whether the mask bit for the category of {@code ch} is set,
   *         inverted when {@code alt} is set
   */
  @Override
  public boolean contains(int ch) {
    final int type = Character.getType(ch);
    // Parenthesised to make explicit that '!=' binds tighter than '^'.
    return alt ^ (((category >> type) & 1) != 0);
  }
}

/**
 * Tests whether a code point is one of four specific invisible characters:
 * zero width space, zero width non-joiner, zero width joiner or soft hyphen.
 * The code point must also be reported as a format character.
 *
 * @param c the code point to test
 * @return {@code true} if {@code c} is one of the four listed code points
 *         and has general category {@link Character#FORMAT}
 */
public static boolean isInvisibleChar(int c) {
  if (Character.getType(c) != Character.FORMAT) {
    return false;
  }
  switch (c) {
    case 0x200B: // zero width space
    case 0x200C: // zero width non-joiner
    case 0x200D: // zero width joiner
    case 0x00AD: // soft hyphen
      return true;
    default:
      return false;
  }
}

/**
 * Maps a character to one of five classes used to decide word breaks:
 * upper-case letter, lower-case letter, other letter (title-case, modifier
 * or other letter), decimal digit, or anything else.
 *
 * @param c0 the character to classify
 * @return the class constant for {@code c0}
 */
protected int classify(char c0) {
  final int category = Character.getType(c0);
  if (category == Character.UPPERCASE_LETTER) {
    return UPPER_LETTER;
  }
  if (category == Character.LOWERCASE_LETTER) {
    return LOWER_LETTER;
  }
  if (category == Character.TITLECASE_LETTER
      || category == Character.MODIFIER_LETTER
      || category == Character.OTHER_LETTER) {
    return OTHER_LETTER;
  }
  if (category == Character.DECIMAL_DIGIT_NUMBER) {
    return DIGIT;
  }
  return OTHER;
}

/**
 * Tests whether a character is a lower-case or upper-case letter, a digit,
 * or has a general category value in the range from
 * {@link Character#DASH_PUNCTUATION} (20) to
 * {@link Character#FINAL_QUOTE_PUNCTUATION} (30) inclusive.
 *
 * <p>That numeric range contains the punctuation categories and also the
 * symbol categories (math, currency, modifier, other). Letters that are
 * neither lower case nor upper case are not accepted.
 *
 * @param ch the character to test
 * @return {@code true} if {@code ch} matches one of the conditions above
 */
public static boolean isLetterOrDigitOrPunc(char ch) {
  // TODO: could be changed to isLetterOrDigit from Java 7
  if (Character.isLowerCase(ch) || Character.isUpperCase(ch)) {
    return true;
  }
  if (Character.isDigit(ch)) {
    return true;
  }
  final int category = Character.getType(ch);
  return category >= Character.DASH_PUNCTUATION
      && category <= Character.FINAL_QUOTE_PUNCTUATION;
}

System.out.println(Character.DECIMAL_DIGIT_NUMBER == Character.getType('१'));

/**
 * Rejects code points whose general category is {@link Character#UNASSIGNED}.
 * For such a code point, throws whatever {@code log.unassignedCodePoint}
 * returns; otherwise returns normally.
 *
 * @param input the code point to check
 */
public static void forbidUnassigned(int input) {
  final boolean assigned = Character.getType(input) != Character.UNASSIGNED;
  if (assigned) {
    return;
  }
  throw log.unassignedCodePoint(input);
}

/**
 * Draws code points from {@code intBetween} until one is found that can be
 * used when composing a string: candidates that are unassigned, private-use
 * or surrogate are discarded and a new one is drawn.
 *
 * @param maxCodePoint the upper bound passed to {@code intBetween}; the lower
 *                     bound is {@link Character#MIN_CODE_POINT}
 * @return the first drawn code point that is not in a discarded category
 */
private int nextValidCodePoint( int maxCodePoint )
{
  while ( true )
  {
    final int candidate = intBetween( Character.MIN_CODE_POINT, maxCodePoint );
    switch ( Character.getType( candidate ) )
    {
    case Character.UNASSIGNED:
    case Character.PRIVATE_USE:
    case Character.SURROGATE:
      // Not usable in a string; draw again.
      continue;
    default:
      return candidate;
    }
  }
}

final List<String> list = new ArrayList<>();
int tokenStart = 0;
int currentType = Character.getType(c[tokenStart]);
for (int pos = tokenStart + 1; pos < c.length; pos++) {
  final int type = Character.getType(c[pos]);
  if (type == currentType) {
    continue;

List list = new ArrayList();
int tokenStart = 0;
int currentType = Character.getType(c[tokenStart]);
for (int pos = tokenStart + 1; pos < c.length; pos++) {
  int type = Character.getType(c[pos]);
  if (type == currentType) {
    continue;

/**
 * Returns the Unicode directionality of a code point.
 *
 * <p>Unassigned code points yield
 * {@link Character#DIRECTIONALITY_UNDEFINED}. Otherwise the value from
 * {@code getDirectionalityImpl} is used as an index into the
 * {@code DIRECTIONALITY} table, except that {@code -1} is returned
 * unchanged.
 *
 * @param codePoint
 *            the Unicode code point to look up.
 * @return the Unicode directionality of {@code codePoint}.
 */
public static byte getDirectionality(int codePoint) {
  final boolean unassigned = getType(codePoint) == Character.UNASSIGNED;
  if (unassigned) {
    return Character.DIRECTIONALITY_UNDEFINED;
  }
  final byte tableIndex = getDirectionalityImpl(codePoint);
  if (tableIndex != -1) {
    return DIRECTIONALITY[tableIndex];
  }
  // -1 is passed through rather than used as an index.
  return -1;
}

  /**
   * Tests whether a character may appear in a non-leading position of an
   * identifier: either it is accepted by {@code isSbeCSharpIdentifierStart},
   * or its general category is Mn, Mc, Nd, Pc or Cf.
   *
   * @param c the character to test
   * @return {@code true} if {@code c} is accepted as an identifier part
   */
  private static boolean isSbeCSharpIdentifierPart(final char c)
  {
    if (isSbeCSharpIdentifierStart(c))
    {
      return true;
    }

    final int category = Character.getType(c);
    return category == Character.NON_SPACING_MARK // Mn
      || category == Character.COMBINING_SPACING_MARK // Mc
      || category == Character.DECIMAL_DIGIT_NUMBER // Nd
      || category == Character.CONNECTOR_PUNCTUATION // Pc
      || category == Character.FORMAT; // Cf
  }
}

/**
 * Builds a string of {@code length} random characters. Candidates are drawn
 * as {@code MIN_RANDOM_CODEPOINT + r.nextInt(RANGE_RANDOM_CODEPOINT)} and
 * redrawn when the code point is undefined or private-use, or when its
 * {@code char} value is a surrogate.
 *
 * @param r      the random source
 * @param length the number of characters to generate; a non-positive value
 *               gives an empty string
 * @return the generated string
 */
public static String getRandUnicodeString(Random r, int length) {
 StringBuilder result = new StringBuilder();
 int appended = 0;
 while (appended < length) {
  int candidate = MIN_RANDOM_CODEPOINT + r.nextInt(RANGE_RANDOM_CODEPOINT);
  char asChar = (char) candidate;
  boolean usable = Character.isDefined(candidate)
    && Character.getType(candidate) != Character.PRIVATE_USE
    && !Character.isSurrogate(asChar);
  if (usable) {
   result.append(asChar);
   appended++;
  }
 }
 return result.toString();
}

/**
 * Decodes a UTF-8 encoded binary value, substituting the given replacement
 * code point for invalid sequences via {@code SliceUtf8.fixInvalidUtf8}.
 *
 * <p>The replacement must lie in the range 0..{@code MAX_CODE_POINT} and must
 * not be a surrogate. The negative check is needed because a negative value
 * narrowed to {@code int} is not classified as a surrogate and would
 * otherwise reach the decoder unchecked.
 *
 * @param slice                the UTF-8 encoded bytes
 * @param replacementCodePoint the code point substituted for invalid sequences
 * @return the decoded string
 * @throws PrestoException with {@code INVALID_FUNCTION_ARGUMENT} if the
 *         replacement code point is out of range or a surrogate
 */
@Description("decodes the UTF-8 encoded string")
@ScalarFunction
@SqlType(StandardTypes.VARCHAR)
public static Slice fromUtf8(@SqlType(StandardTypes.VARBINARY) Slice slice, @SqlType(StandardTypes.BIGINT) long replacementCodePoint)
{
  // Range-check on the long value first so the narrowing cast below cannot wrap.
  if (replacementCodePoint < 0 || replacementCodePoint > MAX_CODE_POINT
      || Character.getType((int) replacementCodePoint) == SURROGATE) {
    throw new PrestoException(INVALID_FUNCTION_ARGUMENT, "Invalid replacement character");
  }
  return SliceUtf8.fixInvalidUtf8(slice, OptionalInt.of((int) replacementCodePoint));
}

/**
 * Processes one raw output frame.
 *
 * <p>If bytes were held back from the previous frame, they are prepended and
 * the combined bytes are decoded again. If the resulting text ends with a
 * character of category {@link Character#OTHER_SYMBOL}, the bytes are held
 * back in {@code brokenFrame} and nothing is emitted for this call. Otherwise
 * the text goes through {@code processAnsiColorCodes} and then
 * {@code normalizeLogLines}.
 *
 * @param outputFrame the frame to process
 * @param consumer    the consumer passed on to {@code processAnsiColorCodes}
 *                    and {@code normalizeLogLines}
 */
private synchronized void processRawFrame(OutputFrame outputFrame, Consumer<OutputFrame> consumer) {
  String utf8String = outputFrame.getUtf8String();
  byte[] bytes = outputFrame.getBytes();
  // Merging the strings by bytes to solve the problem breaking non-latin unicode symbols.
  if (brokenFrame != null) {
    bytes = merge(brokenFrame.getBytes(), bytes);
    // Decode explicitly as UTF-8; new String(byte[]) would use the platform default charset.
    utf8String = new String(bytes, java.nio.charset.StandardCharsets.UTF_8);
    brokenFrame = null;
  }
  // Logger chunks can break the string in middle of multibyte unicode character.
  // Backup the bytes to reconstruct proper char sequence with bytes from next frame.
  // An empty string has no last character to inspect, so the check is skipped for it.
  if (!utf8String.isEmpty()) {
    // NOTE(review): presumably this targets U+FFFD, which a truncated sequence decodes to
    // and whose category is OTHER_SYMBOL; text that really ends in a symbol is held back too.
    int lastCharacterType = Character.getType(utf8String.charAt(utf8String.length() - 1));
    if (lastCharacterType == Character.OTHER_SYMBOL) {
      brokenFrame = new OutputFrame(outputFrame.getType(), bytes);
      return;
    }
  }
  utf8String = processAnsiColorCodes(utf8String, consumer);
  normalizeLogLines(utf8String, consumer);
}

Javadoc

Gets the general Unicode category of the specified character.

Popular methods of Character

isWhitespace
Determines if the specified character (Unicode code point) is white space according to Java. A chara
isDigit
Determines if the specified character (Unicode code point) is a digit. A character is a digit if its
toUpperCase
Returns the upper case equivalent for the specified code point if the code point is a lower case let
toLowerCase
Returns the lower case equivalent for the specified code point if it is an upper case letter. Otherw
isUpperCase
Indicates whether the specified code point is an upper case letter.
toString
isLetter
Determines if the specified character (Unicode code point) is a letter. A character is considered to
isLetterOrDigit
Determines if the specified character (Unicode code point) is a letter or digit. A character is con
charValue
Returns the value of this Character object.
digit
Returns the numeric value of the specified character (Unicode code point) in the specified radix.If
isLowerCase
Indicates whether the specified code point is a lower case letter.
isJavaIdentifierPart
Determines if the character (Unicode code point) may be part of a Java identifier as other than the

Popular in Java

Reactive rest calls using spring rest template
orElseThrow (Optional)
Return the contained value, if present, otherwise throw an exception to be created by the provided s
getSharedPreferences (Context)
onRequestPermissionsResult (Fragment)
RandomAccessFile (java.io)
Allows reading from and writing to a file in a random-access manner. This is different from the uni-
SocketTimeoutException (java.net)
This exception is thrown when a timeout expired on a socket read or accept operation.
SQLException (java.sql)
An exception that indicates a failed JDBC operation. It provides the following information about pro
Timestamp (java.sql)
A Java representation of the SQL TIMESTAMP type. It provides the capability of representing the SQL
Arrays (java.util)
This class contains various methods for manipulating arrays (such as sorting and searching). This cl
XPath (javax.xml.xpath)
XPath provides access to the XPath evaluation environment and expressions. Evaluation of XPath Expr
Top plugins for WebStorm

How to use the getType method in java.lang.Character

Best Java code snippets using java.lang.Character.getType (Showing top 20 results out of 3,024)

How to use the getType method in java.lang.Character