org.joni.encoding.unicode
Class UnicodeEncoding

java.lang.Object
  extended by org.joni.encoding.Encoding
      extended by org.joni.encoding.MultiByteEncoding
          extended by org.joni.encoding.unicode.UnicodeEncoding
Direct Known Subclasses:
UTF16BEEncoding, UTF16LEEncoding, UTF32BEEncoding, UTF32LEEncoding, UTF8Encoding

public abstract class UnicodeEncoding
extends MultiByteEncoding


Field Summary
protected static int[][] AsciiLowerMap
           
static byte[] AsciiToLowerCaseTable
           
static byte[] AsciiToUpperCaseTable
           
protected static CaseFoldCodeItem[] EMPTY_FOLD_CODES
           
 
Fields inherited from class org.joni.encoding.MultiByteEncoding
EncLen
 
Fields inherited from class org.joni.encoding.Encoding
hashCode, name, NEW_LINE
 
Constructor Summary
protected UnicodeEncoding(int[] EncLen)
           
 
Method Summary
 void applyAllCaseFold(int flag, ApplyAllCaseFoldFunction fun, java.lang.Object arg)
          onigenc_ascii_apply_all_case_fold / used also by multibyte encodings
protected  void asciiApplyAllCaseFold(int flag, ApplyAllCaseFoldFunction fun, java.lang.Object arg)
           
protected  CaseFoldCodeItem[] asciiCaseFoldCodesByString(int flag, byte[] bytes, int p, int end)
           
protected  int asciiMbcCaseFold(int flag, byte[] bytes, IntHolder pp, int end, byte[] lower)
           
 CaseFoldCodeItem[] caseFoldCodesByString(int flag, byte[] bytes, int p, int end)
          onigenc_ascii_get_case_fold_codes_by_str / used also by multibyte encodings
protected  int[] ctypeCodeRange(int ctype)
           
 boolean isCodeCType(int code, int ctype)
          Checks whether the given code is of the given character type (e.g. used by isWord(someByte) and similar methods).
protected  boolean isCodeCTypeInternal(int code, int ctype)
          ONIGENC_IS_XXXXXX_CODE_CTYPE
 boolean isNewLine(byte[] bytes, int p, int end)
          onigenc_is_mbc_newline_0x0a / used also by multibyte encodings
 int mbcCaseFold(int flag, byte[] bytes, IntHolder pp, int end, byte[] fold)
          onigenc_ascii_mbc_case_fold
 int propertyNameToCType(byte[] name, int p, int end)
          onigenc_minimum_property_name_to_ctype notably overridden by unicode encodings
 
Methods inherited from class org.joni.encoding.MultiByteEncoding
isSingleByte, length, mb2CodeToMbc, mb2CodeToMbcLength, mb2IsCodeCType, mb4CodeToMbc, mb4CodeToMbcLength, mb4IsCodeCType, mbnMbcCaseFold, mbnMbcToCode
 
Methods inherited from class org.joni.encoding.Encoding
asciiToLower, asciiToUpper, codeToMbc, codeToMbcLength, ctypeCodeRange, digitVal, equals, getName, hashCode, isAlnum, isAlpha, isAscii, isBlank, isCntrl, isDigit, isFixedWidth, isGraph, isLower, isMbcAscii, isMbcCrnl, isMbcHead, isMbcWord, isNewLine, isPrint, isPunct, isReverseMatchAllowed, isSbWord, isSpace, isUpper, isWord, isWordGraphPrint, isXDigit, leftAdjustCharHead, maxLength, maxLengthDistance, mbcodeStartPosition, mbcToCode, minLength, odigitVal, prevCharHead, rightAdjustCharHead, rightAdjustCharHeadWithPrev, step, stepBack, strByteLengthNull, strLength, strLengthNull, strNCmp, toLowerCaseTable, toString, xdigitVal
 
Methods inherited from class java.lang.Object
clone, finalize, getClass, notify, notifyAll, wait, wait, wait
 

Field Detail

AsciiToLowerCaseTable

public static final byte[] AsciiToLowerCaseTable

AsciiToUpperCaseTable

public static final byte[] AsciiToUpperCaseTable

AsciiLowerMap

protected static final int[][] AsciiLowerMap

EMPTY_FOLD_CODES

protected static final CaseFoldCodeItem[] EMPTY_FOLD_CODES
Constructor Detail

UnicodeEncoding

protected UnicodeEncoding(int[] EncLen)
Method Detail

isCodeCType

public boolean isCodeCType(int code,
                           int ctype)
Description copied from class: Encoding
Checks whether the given code is of the given character type (e.g. used by isWord(someByte) and similar methods).

Specified by:
isCodeCType in class Encoding
Parameters:
code - a code point of a character
ctype - a character type to check against. Oniguruma equivalent: is_code_ctype

ctypeCodeRange

protected final int[] ctypeCodeRange(int ctype)

propertyNameToCType

public int propertyNameToCType(byte[] name,
                               int p,
                               int end)
onigenc_minimum_property_name_to_ctype notably overridden by unicode encodings


mbcCaseFold

public int mbcCaseFold(int flag,
                       byte[] bytes,
                       IntHolder pp,
                       int end,
                       byte[] fold)
onigenc_ascii_mbc_case_fold

Parameters:
flag - case fold flag
pp - an IntHolder that points at character head
fold - a buffer into which the case-folded character is extracted. Oniguruma equivalent: mbc_case_fold

applyAllCaseFold

public void applyAllCaseFold(int flag,
                             ApplyAllCaseFoldFunction fun,
                             java.lang.Object arg)
onigenc_ascii_apply_all_case_fold / used also by multibyte encodings

Parameters:
flag - case fold flag
fun - case folding functor (see: ApplyCaseFold)
arg - case folding functor argument (see: ApplyCaseFoldArg). Oniguruma equivalent: apply_all_case_fold

caseFoldCodesByString

public CaseFoldCodeItem[] caseFoldCodesByString(int flag,
                                                byte[] bytes,
                                                int p,
                                                int end)
onigenc_ascii_get_case_fold_codes_by_str / used also by multibyte encodings


isCodeCTypeInternal

protected final boolean isCodeCTypeInternal(int code,
                                            int ctype)
ONIGENC_IS_XXXXXX_CODE_CTYPE


isNewLine

public boolean isNewLine(byte[] bytes,
                         int p,
                         int end)
onigenc_is_mbc_newline_0x0a / used also by multibyte encodings

Specified by:
isNewLine in class Encoding

asciiMbcCaseFold

protected final int asciiMbcCaseFold(int flag,
                                     byte[] bytes,
                                     IntHolder pp,
                                     int end,
                                     byte[] lower)

asciiApplyAllCaseFold

protected final void asciiApplyAllCaseFold(int flag,
                                           ApplyAllCaseFoldFunction fun,
                                           java.lang.Object arg)

asciiCaseFoldCodesByString

protected final CaseFoldCodeItem[] asciiCaseFoldCodesByString(int flag,
                                                              byte[] bytes,
                                                              int p,
                                                              int end)


Copyright © 2008. All Rights Reserved.