public final class CharScript extends Object
Script related utilities.
This work was originally authored by Glenn Adams (gadams@apache.org).
Modifier and Type | Field and Description |
---|---|
static int |
SCRIPT_ARABIC
arabic script constant
|
static int |
SCRIPT_BENGALI
bengali script constant
|
static int |
SCRIPT_BENGALI_2
bengali 2 script constant
|
static int |
SCRIPT_BOPOMOFO
bopomofo script constant
|
static int |
SCRIPT_BURMESE
burmese script constant
|
static int |
SCRIPT_CYRILLIC
cyrillic script constant
|
static int |
SCRIPT_DEVANAGARI
devanagari script constant
|
static int |
SCRIPT_DEVANAGARI_2
devanagari 2 script constant
|
static int |
SCRIPT_ETHIOPIC
ethiopic script constant
|
static int |
SCRIPT_GEORGIAN
georgian script constant
|
static int |
SCRIPT_GREEK
greek script constant
|
static int |
SCRIPT_GUJARATI
gujarati script constant
|
static int |
SCRIPT_GUJARATI_2
gujarati 2 script constant
|
static int |
SCRIPT_GURMUKHI
gurmukhi script constant
|
static int |
SCRIPT_GURMUKHI_2
gurmukhi 2 script constant
|
static int |
SCRIPT_HAN
han script constant
|
static int |
SCRIPT_HANGUL
hangul script constant
|
static int |
SCRIPT_HEBREW
hebrew script constant
|
static int |
SCRIPT_HIRAGANA
hiragana script constant
|
static int |
SCRIPT_KANNADA
kannada script constant
|
static int |
SCRIPT_KANNADA_2
kannada 2 script constant
|
static int |
SCRIPT_KATAKANA
katakana script constant
|
static int |
SCRIPT_KHMER
khmer script constant
|
static int |
SCRIPT_LAO
lao script constant
|
static int |
SCRIPT_LATIN
latin script constant
|
static int |
SCRIPT_MALAYALAM
malayalam script constant
|
static int |
SCRIPT_MALAYALAM_2
malayalam 2 script constant
|
static int |
SCRIPT_MATH
math script constant
|
static int |
SCRIPT_MONGOLIAN
mongolian script constant
|
static int |
SCRIPT_ORIYA
oriya script constant
|
static int |
SCRIPT_ORIYA_2
oriya 2 script constant
|
static int |
SCRIPT_SINHALESE
sinhalese script constant
|
static int |
SCRIPT_SYMBOL
symbol script constant
|
static int |
SCRIPT_TAMIL
tamil script constant
|
static int |
SCRIPT_TAMIL_2
tamil 2 script constant
|
static int |
SCRIPT_TELUGU
telugu script constant
|
static int |
SCRIPT_TELUGU_2
telugu 2 script constant
|
static int |
SCRIPT_THAI
thai script constant
|
static int |
SCRIPT_TIBETAN
tibetan script constant
|
static int |
SCRIPT_UNCODED
uncoded script constant
|
static int |
SCRIPT_UNDETERMINED
undetermined script constant
|
Modifier and Type | Method and Description |
---|---|
static int |
dominantScript(CharSequence cs)
Determine the dominant script of a character sequence.
|
static boolean |
isArabic(int c)
Determine if character c belongs to the arabic script.
|
static boolean |
isBengali(int c)
Determine if character c belongs to the bengali script.
|
static boolean |
isBopomofo(int c)
Determine if character c belongs to the bopomofo script.
|
static boolean |
isBurmese(int c)
Determine if character c belongs to the burmese script.
|
static boolean |
isCyrillic(int c)
Determine if character c belongs to the cyrillic script.
|
static boolean |
isDevanagari(int c)
Determine if character c belongs to the devanagari script.
|
static boolean |
isDigit(int c)
Determine if character c is a digit.
|
static boolean |
isEthiopic(int c)
Determine if character c belongs to the ethiopic (amharic) script.
|
static boolean |
isGeorgian(int c)
Determine if character c belongs to the georgian script.
|
static boolean |
isGreek(int c)
Determine if character c belongs to the greek script.
|
static boolean |
isGujarati(int c)
Determine if character c belongs to the gujarati script.
|
static boolean |
isGurmukhi(int c)
Determine if character c belongs to the gurmukhi script.
|
static boolean |
isHan(int c)
Determine if character c belongs to the han (unified cjk) script.
|
static boolean |
isHangul(int c)
Determine if character c belongs to the hangul script.
|
static boolean |
isHebrew(int c)
Determine if character c belongs to the hebrew script.
|
static boolean |
isHiragana(int c)
Determine if character c belongs to the hiragana script.
|
static boolean |
isIndicScript(int script)
Determine if script tag denotes an 'Indic' script, where a
script is an 'Indic' script if it is intended to be processed by
the generic 'Indic' Script Processor.
|
static boolean |
isIndicScript(String script)
Determine if script tag denotes an 'Indic' script, where a
script is an 'Indic' script if it is intended to be processed by
the generic 'Indic' Script Processor.
|
static boolean |
isKannada(int c)
Determine if character c belongs to the kannada script.
|
static boolean |
isKatakana(int c)
Determine if character c belongs to the katakana script.
|
static boolean |
isKhmer(int c)
Determine if character c belongs to the khmer script.
|
static boolean |
isLao(int c)
Determine if character c belongs to the lao script.
|
static boolean |
isLatin(int c)
Determine if character c belongs to the latin script.
|
static boolean |
isMalayalam(int c)
Determine if character c belongs to the malayalam script.
|
static boolean |
isMongolian(int c)
Determine if character c belongs to the mongolian script.
|
static boolean |
isOriya(int c)
Determine if character c belongs to the oriya script.
|
static boolean |
isPunctuation(int c)
Determine if character c is punctuation.
|
static boolean |
isSinhalese(int c)
Determine if character c belongs to the sinhalese script.
|
static boolean |
isTamil(int c)
Determine if character c belongs to the tamil script.
|
static boolean |
isTelugu(int c)
Determine if character c belongs to the telugu script.
|
static boolean |
isThai(int c)
Determine if character c belongs to the thai script.
|
static boolean |
isTibetan(int c)
Determine if character c belongs to the tibetan script.
|
static int |
scriptCodeFromTag(String tag)
Determine the internal script code associated with a script tag.
|
static int |
scriptOf(int c)
Obtain the ISO 15924 numeric script code of a character.
|
static int[] |
scriptsOf(CharSequence cs)
Obtain the script codes of each character in a character sequence.
|
static String |
scriptTagFromCode(int code)
Determine the script tag associated with an internal script code.
|
static int |
useV2IndicRules(int sc)
Obtain the V2 indic script code corresponding to V1 indic script code SC if
and only if V2 indic rules apply; otherwise return SC.
|
public static final int SCRIPT_HEBREW
public static final int SCRIPT_MONGOLIAN
public static final int SCRIPT_ARABIC
public static final int SCRIPT_GREEK
public static final int SCRIPT_LATIN
public static final int SCRIPT_CYRILLIC
public static final int SCRIPT_GEORGIAN
public static final int SCRIPT_BOPOMOFO
public static final int SCRIPT_HANGUL
public static final int SCRIPT_GURMUKHI
public static final int SCRIPT_GURMUKHI_2
public static final int SCRIPT_DEVANAGARI
public static final int SCRIPT_DEVANAGARI_2
public static final int SCRIPT_GUJARATI
public static final int SCRIPT_GUJARATI_2
public static final int SCRIPT_BENGALI
public static final int SCRIPT_BENGALI_2
public static final int SCRIPT_ORIYA
public static final int SCRIPT_ORIYA_2
public static final int SCRIPT_TIBETAN
public static final int SCRIPT_TELUGU
public static final int SCRIPT_TELUGU_2
public static final int SCRIPT_KANNADA
public static final int SCRIPT_KANNADA_2
public static final int SCRIPT_TAMIL
public static final int SCRIPT_TAMIL_2
public static final int SCRIPT_MALAYALAM
public static final int SCRIPT_MALAYALAM_2
public static final int SCRIPT_SINHALESE
public static final int SCRIPT_BURMESE
public static final int SCRIPT_THAI
public static final int SCRIPT_KHMER
public static final int SCRIPT_LAO
public static final int SCRIPT_HIRAGANA
public static final int SCRIPT_ETHIOPIC
public static final int SCRIPT_HAN
public static final int SCRIPT_KATAKANA
public static final int SCRIPT_MATH
public static final int SCRIPT_SYMBOL
public static final int SCRIPT_UNDETERMINED
public static final int SCRIPT_UNCODED
public static boolean isPunctuation(int c)
c
- a character represented as a Unicode scalar value
public static boolean isDigit(int c)
c
- a character represented as a Unicode scalar value
public static boolean isHebrew(int c)
c
- a character represented as a Unicode scalar value
public static boolean isMongolian(int c)
c
- a character represented as a Unicode scalar value
public static boolean isArabic(int c)
c
- a character represented as a Unicode scalar value
public static boolean isGreek(int c)
c
- a character represented as a Unicode scalar value
public static boolean isLatin(int c)
c
- a character represented as a Unicode scalar value
public static boolean isCyrillic(int c)
c
- a character represented as a Unicode scalar value
public static boolean isGeorgian(int c)
c
- a character represented as a Unicode scalar value
public static boolean isHangul(int c)
c
- a character represented as a Unicode scalar value
public static boolean isGurmukhi(int c)
c
- a character represented as a Unicode scalar value
public static boolean isDevanagari(int c)
c
- a character represented as a Unicode scalar value
public static boolean isGujarati(int c)
c
- a character represented as a Unicode scalar value
public static boolean isBengali(int c)
c
- a character represented as a Unicode scalar value
public static boolean isOriya(int c)
c
- a character represented as a Unicode scalar value
public static boolean isTibetan(int c)
c
- a character represented as a Unicode scalar value
public static boolean isTelugu(int c)
c
- a character represented as a Unicode scalar value
public static boolean isKannada(int c)
c
- a character represented as a Unicode scalar value
public static boolean isTamil(int c)
c
- a character represented as a Unicode scalar value
public static boolean isMalayalam(int c)
c
- a character represented as a Unicode scalar value
public static boolean isSinhalese(int c)
c
- a character represented as a Unicode scalar value
public static boolean isBurmese(int c)
c
- a character represented as a Unicode scalar value
public static boolean isThai(int c)
c
- a character represented as a Unicode scalar value
public static boolean isKhmer(int c)
c
- a character represented as a Unicode scalar value
public static boolean isLao(int c)
c
- a character represented as a Unicode scalar value
public static boolean isEthiopic(int c)
c
- a character represented as a Unicode scalar value
public static boolean isHan(int c)
c
- a character represented as a Unicode scalar value
public static boolean isBopomofo(int c)
c
- a character represented as a Unicode scalar value
public static boolean isHiragana(int c)
c
- a character represented as a Unicode scalar value
public static boolean isKatakana(int c)
c
- a character represented as a Unicode scalar value
public static int scriptOf(int c)
c
- the character whose script is to be obtained
public static int useV2IndicRules(int sc)
sc
- a V1 indic script code
public static int[] scriptsOf(CharSequence cs)
cs
- the character sequence
public static int dominantScript(CharSequence cs)
cs
- the character sequence
public static boolean isIndicScript(String script)
script
- a script tag
public static boolean isIndicScript(int script)
script
- a script code
public static String scriptTagFromCode(int code)
code
- the script code
public static int scriptCodeFromTag(String tag)
tag
- the script tag
Copyright © 2025 Apache Software Foundation. All rights reserved.