public final class CharScript
extends java.lang.Object
Script related utilities.
This work was originally authored by Glenn Adams (gadams@apache.org).
Modifier and Type | Field | Description |
---|---|---|
static int |
SCRIPT_ARABIC |
arabic script constant
|
static int |
SCRIPT_BENGALI |
bengali script constant
|
static int |
SCRIPT_BENGALI_2 |
bengali 2 script constant
|
static int |
SCRIPT_BOPOMOFO |
bopomofo script constant
|
static int |
SCRIPT_BURMESE |
burmese script constant
|
static int |
SCRIPT_CYRILLIC |
cyrillic script constant
|
static int |
SCRIPT_DEVANAGARI |
devanagari script constant
|
static int |
SCRIPT_DEVANAGARI_2 |
devanagari 2 script constant
|
static int |
SCRIPT_ETHIOPIC |
ethiopic script constant
|
static int |
SCRIPT_GEORGIAN |
georgian script constant
|
static int |
SCRIPT_GREEK |
greek script constant
|
static int |
SCRIPT_GUJARATI |
gujarati script constant
|
static int |
SCRIPT_GUJARATI_2 |
gujarati 2 script constant
|
static int |
SCRIPT_GURMUKHI |
gurmukhi script constant
|
static int |
SCRIPT_GURMUKHI_2 |
gurmukhi 2 script constant
|
static int |
SCRIPT_HAN |
han script constant
|
static int |
SCRIPT_HANGUL |
hangul script constant
|
static int |
SCRIPT_HEBREW |
hebrew script constant
|
static int |
SCRIPT_HIRAGANA |
hiragana script constant
|
static int |
SCRIPT_KANNADA |
kannada script constant
|
static int |
SCRIPT_KANNADA_2 |
kannada 2 script constant
|
static int |
SCRIPT_KATAKANA |
katakana script constant
|
static int |
SCRIPT_KHMER |
khmer script constant
|
static int |
SCRIPT_LAO |
lao script constant
|
static int |
SCRIPT_LATIN |
latin script constant
|
static int |
SCRIPT_MALAYALAM |
malayalam script constant
|
static int |
SCRIPT_MALAYALAM_2 |
malayalam 2 script constant
|
static int |
SCRIPT_MATH |
math script constant
|
static int |
SCRIPT_MONGOLIAN |
mongolian script constant
|
static int |
SCRIPT_ORIYA |
oriya script constant
|
static int |
SCRIPT_ORIYA_2 |
oriya 2 script constant
|
static int |
SCRIPT_SINHALESE |
sinhalese script constant
|
static int |
SCRIPT_SYMBOL |
symbol script constant
|
static int |
SCRIPT_TAMIL |
tamil script constant
|
static int |
SCRIPT_TAMIL_2 |
tamil 2 script constant
|
static int |
SCRIPT_TELUGU |
telugu script constant
|
static int |
SCRIPT_TELUGU_2 |
telugu 2 script constant
|
static int |
SCRIPT_THAI |
thai script constant
|
static int |
SCRIPT_TIBETAN |
tibetan script constant
|
static int |
SCRIPT_UNCODED |
uncoded script constant
|
static int |
SCRIPT_UNDETERMINED |
undetermined script constant
|
Modifier and Type | Method | Description |
---|---|---|
static int |
dominantScript(java.lang.CharSequence cs) |
Determine the dominant script of a character sequence.
|
static boolean |
isArabic(int c) |
Determine if character c belongs to the arabic script.
|
static boolean |
isBengali(int c) |
Determine if character c belongs to the bengali script.
|
static boolean |
isBopomofo(int c) |
Determine if character c belongs to the bopomofo script.
|
static boolean |
isBurmese(int c) |
Determine if character c belongs to the burmese script.
|
static boolean |
isCyrillic(int c) |
Determine if character c belongs to the cyrillic script.
|
static boolean |
isDevanagari(int c) |
Determine if character c belongs to the devanagari script.
|
static boolean |
isDigit(int c) |
Determine if character c is a digit.
|
static boolean |
isEthiopic(int c) |
Determine if character c belongs to the ethiopic (amharic) script.
|
static boolean |
isGeorgian(int c) |
Determine if character c belongs to the georgian script.
|
static boolean |
isGreek(int c) |
Determine if character c belongs to the greek script.
|
static boolean |
isGujarati(int c) |
Determine if character c belongs to the gujarati script.
|
static boolean |
isGurmukhi(int c) |
Determine if character c belongs to the gurmukhi script.
|
static boolean |
isHan(int c) |
Determine if character c belongs to the han (unified cjk) script.
|
static boolean |
isHangul(int c) |
Determine if character c belongs to the hangul script.
|
static boolean |
isHebrew(int c) |
Determine if character c belongs to the hebrew script.
|
static boolean |
isHiragana(int c) |
Determine if character c belongs to the hiragana script.
|
static boolean |
isIndicScript(int script) |
Determine if script tag denotes an 'Indic' script, where a
script is an 'Indic' script if it is intended to be processed by
the generic 'Indic' Script Processor.
|
static boolean |
isIndicScript(java.lang.String script) |
Determine if script tag denotes an 'Indic' script, where a
script is an 'Indic' script if it is intended to be processed by
the generic 'Indic' Script Processor.
|
static boolean |
isKannada(int c) |
Determine if character c belongs to the kannada script.
|
static boolean |
isKatakana(int c) |
Determine if character c belongs to the katakana script.
|
static boolean |
isKhmer(int c) |
Determine if character c belongs to the khmer script.
|
static boolean |
isLao(int c) |
Determine if character c belongs to the lao script.
|
static boolean |
isLatin(int c) |
Determine if character c belongs to the latin script.
|
static boolean |
isMalayalam(int c) |
Determine if character c belongs to the malayalam script.
|
static boolean |
isMongolian(int c) |
Determine if character c belongs to the mongolian script.
|
static boolean |
isOriya(int c) |
Determine if character c belongs to the oriya script.
|
static boolean |
isPunctuation(int c) |
Determine if character c is punctuation.
|
static boolean |
isSinhalese(int c) |
Determine if character c belongs to the sinhalese script.
|
static boolean |
isTamil(int c) |
Determine if character c belongs to the tamil script.
|
static boolean |
isTelugu(int c) |
Determine if character c belongs to the telugu script.
|
static boolean |
isThai(int c) |
Determine if character c belongs to the thai script.
|
static boolean |
isTibetan(int c) |
Determine if character c belongs to the tibetan script.
|
static int |
scriptCodeFromTag(java.lang.String tag) |
Determine the internal script code associated with a script tag.
|
static int |
scriptOf(int c) |
Obtain the ISO 15924 numeric script code of a character.
|
static int[] |
scriptsOf(java.lang.CharSequence cs) |
Obtain the script codes of each character in a character sequence.
|
static java.lang.String |
scriptTagFromCode(int code) |
Determine the script tag associated with an internal script code.
|
static int |
useV2IndicRules(int sc) |
Obtain the V2 indic script code corresponding to V1 indic script code SC if
and only if V2 indic rules apply; otherwise return SC.
|
public static final int SCRIPT_HEBREW
public static final int SCRIPT_MONGOLIAN
public static final int SCRIPT_ARABIC
public static final int SCRIPT_GREEK
public static final int SCRIPT_LATIN
public static final int SCRIPT_CYRILLIC
public static final int SCRIPT_GEORGIAN
public static final int SCRIPT_BOPOMOFO
public static final int SCRIPT_HANGUL
public static final int SCRIPT_GURMUKHI
public static final int SCRIPT_GURMUKHI_2
public static final int SCRIPT_DEVANAGARI
public static final int SCRIPT_DEVANAGARI_2
public static final int SCRIPT_GUJARATI
public static final int SCRIPT_GUJARATI_2
public static final int SCRIPT_BENGALI
public static final int SCRIPT_BENGALI_2
public static final int SCRIPT_ORIYA
public static final int SCRIPT_ORIYA_2
public static final int SCRIPT_TIBETAN
public static final int SCRIPT_TELUGU
public static final int SCRIPT_TELUGU_2
public static final int SCRIPT_KANNADA
public static final int SCRIPT_KANNADA_2
public static final int SCRIPT_TAMIL
public static final int SCRIPT_TAMIL_2
public static final int SCRIPT_MALAYALAM
public static final int SCRIPT_MALAYALAM_2
public static final int SCRIPT_SINHALESE
public static final int SCRIPT_BURMESE
public static final int SCRIPT_THAI
public static final int SCRIPT_KHMER
public static final int SCRIPT_LAO
public static final int SCRIPT_HIRAGANA
public static final int SCRIPT_ETHIOPIC
public static final int SCRIPT_HAN
public static final int SCRIPT_KATAKANA
public static final int SCRIPT_MATH
public static final int SCRIPT_SYMBOL
public static final int SCRIPT_UNDETERMINED
public static final int SCRIPT_UNCODED
public static boolean isPunctuation(int c)
c
- a character represented as a Unicode scalar value
public static boolean isDigit(int c)
c
- a character represented as a Unicode scalar value
public static boolean isHebrew(int c)
c
- a character represented as a Unicode scalar value
public static boolean isMongolian(int c)
c
- a character represented as a Unicode scalar value
public static boolean isArabic(int c)
c
- a character represented as a Unicode scalar value
public static boolean isGreek(int c)
c
- a character represented as a Unicode scalar value
public static boolean isLatin(int c)
c
- a character represented as a Unicode scalar value
public static boolean isCyrillic(int c)
c
- a character represented as a Unicode scalar value
public static boolean isGeorgian(int c)
c
- a character represented as a Unicode scalar value
public static boolean isHangul(int c)
c
- a character represented as a Unicode scalar value
public static boolean isGurmukhi(int c)
c
- a character represented as a Unicode scalar value
public static boolean isDevanagari(int c)
c
- a character represented as a Unicode scalar value
public static boolean isGujarati(int c)
c
- a character represented as a Unicode scalar value
public static boolean isBengali(int c)
c
- a character represented as a Unicode scalar value
public static boolean isOriya(int c)
c
- a character represented as a Unicode scalar value
public static boolean isTibetan(int c)
c
- a character represented as a Unicode scalar value
public static boolean isTelugu(int c)
c
- a character represented as a Unicode scalar value
public static boolean isKannada(int c)
c
- a character represented as a Unicode scalar value
public static boolean isTamil(int c)
c
- a character represented as a Unicode scalar value
public static boolean isMalayalam(int c)
c
- a character represented as a Unicode scalar value
public static boolean isSinhalese(int c)
c
- a character represented as a Unicode scalar value
public static boolean isBurmese(int c)
c
- a character represented as a Unicode scalar value
public static boolean isThai(int c)
c
- a character represented as a Unicode scalar value
public static boolean isKhmer(int c)
c
- a character represented as a Unicode scalar value
public static boolean isLao(int c)
c
- a character represented as a Unicode scalar value
public static boolean isEthiopic(int c)
c
- a character represented as a Unicode scalar value
public static boolean isHan(int c)
c
- a character represented as a Unicode scalar value
public static boolean isBopomofo(int c)
c
- a character represented as a Unicode scalar value
public static boolean isHiragana(int c)
c
- a character represented as a Unicode scalar value
public static boolean isKatakana(int c)
c
- a character represented as a Unicode scalar value
public static int scriptOf(int c)
c
- the character whose script is to be obtained
public static int useV2IndicRules(int sc)
sc
- a V1 indic script code
public static int[] scriptsOf(java.lang.CharSequence cs)
cs
- the character sequence
public static int dominantScript(java.lang.CharSequence cs)
cs
- the character sequence
public static boolean isIndicScript(java.lang.String script)
script
- a script tag
public static boolean isIndicScript(int script)
script
- a script code
public static java.lang.String scriptTagFromCode(int code)
code
- the script code
public static int scriptCodeFromTag(java.lang.String tag)
tag
- the script tag
Copyright 1999-2016 The Apache Software Foundation. All Rights Reserved.