org.joni.encoding.specific
Class UTF32LEEncoding

java.lang.Object
  extended by org.joni.encoding.Encoding
      extended by org.joni.encoding.MultiByteEncoding
          extended by org.joni.encoding.unicode.UnicodeEncoding
              extended by org.joni.encoding.specific.UTF32LEEncoding

public final class UTF32LEEncoding
extends UnicodeEncoding


Field Summary
protected static int[][] AsciiLowerMap
           
static byte[] AsciiToLowerCaseTable
           
static byte[] AsciiToUpperCaseTable
           
protected static CaseFoldCodeItem[] EMPTY_FOLD_CODES
           
static UTF32LEEncoding INSTANCE
           
 
Fields inherited from class org.joni.encoding.MultiByteEncoding
EncLen
 
Fields inherited from class org.joni.encoding.Encoding
hashCode, name, NEW_LINE
 
Constructor Summary
protected UTF32LEEncoding()
           
 
Method Summary
protected  void asciiApplyAllCaseFold(int flag, ApplyAllCaseFoldFunction fun, java.lang.Object arg)
           
protected  CaseFoldCodeItem[] asciiCaseFoldCodesByString(int flag, byte[] bytes, int p, int end)
           
protected  int asciiMbcCaseFold(int flag, byte[] bytes, IntHolder pp, int end, byte[] lower)
           
 int codeToMbc(int code, byte[] bytes, int p)
          Extracts code point into its multibyte representation
 int codeToMbcLength(int code)
          Returns character length given a code point. Oniguruma equivalent: code_to_mbclen
 int[] ctypeCodeRange(int ctype, IntHolder sbOut)
          onigenc_utf16_32_get_ctype_code_range
protected  boolean isCodeCTypeInternal(int code, int ctype)
          ONIGENC_IS_XXXXXX_CODE_CTYPE
 boolean isFixedWidth()
           
 boolean isNewLine(byte[] bytes, int p, int end)
          onigenc_is_mbc_newline_0x0a / used also by multibyte encodings
 boolean isReverseMatchAllowed(byte[] bytes, int p, int end)
          Returns true if it's safe to use the reversal Boyer-Moore search fail-fast algorithm. Oniguruma equivalent: is_allowed_reverse_match
 int leftAdjustCharHead(byte[] bytes, int p, int end)
          Seeks the previous character head in a stream. Oniguruma equivalent: left_adjust_char_head
 int length(byte c)
          Returns character length given the character head: returns 1 for single-byte encodings or performs a direct length table lookup for multibyte ones.
 int maxLength()
          Returns maximum character byte length that can appear in an encoding. Oniguruma equivalent: max_enc_len
 int mbcCaseFold(int flag, byte[] bytes, IntHolder pp, int end, byte[] fold)
          onigenc_ascii_mbc_case_fold
 int mbcToCode(byte[] bytes, int p, int end)
          Returns code point for a character. Oniguruma equivalent: mbc_to_code
 int minLength()
          Returns minimum character byte length that can appear in an encoding. Oniguruma equivalent: min_enc_len
 int strLength(byte[] bytes, int p, int end)
           
 java.lang.String toString()
           
 
Methods inherited from class org.joni.encoding.unicode.UnicodeEncoding
applyAllCaseFold, caseFoldCodesByString, ctypeCodeRange, isCodeCType, propertyNameToCType
 
Methods inherited from class org.joni.encoding.MultiByteEncoding
isSingleByte, mb2CodeToMbc, mb2CodeToMbcLength, mb2IsCodeCType, mb4CodeToMbc, mb4CodeToMbcLength, mb4IsCodeCType, mbnMbcCaseFold, mbnMbcToCode
 
Methods inherited from class org.joni.encoding.Encoding
asciiToLower, asciiToUpper, digitVal, equals, getName, hashCode, isAlnum, isAlpha, isAscii, isBlank, isCntrl, isDigit, isGraph, isLower, isMbcAscii, isMbcCrnl, isMbcHead, isMbcWord, isNewLine, isPrint, isPunct, isSbWord, isSpace, isUpper, isWord, isWordGraphPrint, isXDigit, maxLengthDistance, mbcodeStartPosition, odigitVal, prevCharHead, rightAdjustCharHead, rightAdjustCharHeadWithPrev, step, stepBack, strByteLengthNull, strLengthNull, strNCmp, toLowerCaseTable, xdigitVal
 
Methods inherited from class java.lang.Object
clone, finalize, getClass, notify, notifyAll, wait, wait, wait
 

Field Detail

INSTANCE

public static UTF32LEEncoding INSTANCE

AsciiToLowerCaseTable

public static final byte[] AsciiToLowerCaseTable

AsciiToUpperCaseTable

public static final byte[] AsciiToUpperCaseTable

AsciiLowerMap

protected static final int[][] AsciiLowerMap

EMPTY_FOLD_CODES

protected static final CaseFoldCodeItem[] EMPTY_FOLD_CODES
Constructor Detail

UTF32LEEncoding

protected UTF32LEEncoding()
Method Detail

length

public int length(byte c)
Description copied from class: Encoding
Returns character length given the character head: returns 1 for single-byte encodings or performs a direct length table lookup for multibyte ones.

Overrides:
length in class MultiByteEncoding
Parameters:
c - Character head. Oniguruma equivalent: mbc_enc_len

strLength

public int strLength(byte[] bytes,
                     int p,
                     int end)
Overrides:
strLength in class Encoding

toString

public java.lang.String toString()
Specified by:
toString in class Encoding

maxLength

public int maxLength()
Description copied from class: Encoding
Returns maximum character byte length that can appear in an encoding. Oniguruma equivalent: max_enc_len

Specified by:
maxLength in class Encoding

minLength

public int minLength()
Description copied from class: Encoding
Returns minimum character byte length that can appear in an encoding. Oniguruma equivalent: min_enc_len

Specified by:
minLength in class Encoding

isFixedWidth

public boolean isFixedWidth()
Specified by:
isFixedWidth in class Encoding

isNewLine

public boolean isNewLine(byte[] bytes,
                         int p,
                         int end)
onigenc_is_mbc_newline_0x0a / used also by multibyte encodings


mbcToCode

public int mbcToCode(byte[] bytes,
                     int p,
                     int end)
Description copied from class: Encoding
Returns code point for a character. Oniguruma equivalent: mbc_to_code

Specified by:
mbcToCode in class Encoding

codeToMbcLength

public int codeToMbcLength(int code)
Description copied from class: Encoding
Returns character length given a code point. Oniguruma equivalent: code_to_mbclen

Specified by:
codeToMbcLength in class Encoding

codeToMbc

public int codeToMbc(int code,
                     byte[] bytes,
                     int p)
Description copied from class: Encoding
Extracts code point into its multibyte representation

Specified by:
codeToMbc in class Encoding
Returns:
character length for the given code point. Oniguruma equivalent: code_to_mbc

mbcCaseFold

public int mbcCaseFold(int flag,
                       byte[] bytes,
                       IntHolder pp,
                       int end,
                       byte[] fold)
onigenc_ascii_mbc_case_fold

Overrides:
mbcCaseFold in class UnicodeEncoding
Parameters:
flag - case fold flag
pp - an IntHolder that points at character head
fold - a buffer into which the case-folded character is extracted. Oniguruma equivalent: mbc_case_fold

ctypeCodeRange

public int[] ctypeCodeRange(int ctype,
                            IntHolder sbOut)
onigenc_utf16_32_get_ctype_code_range

Specified by:
ctypeCodeRange in class Encoding

leftAdjustCharHead

public int leftAdjustCharHead(byte[] bytes,
                              int p,
                              int end)
Description copied from class: Encoding
Seeks the previous character head in a stream. Oniguruma equivalent: left_adjust_char_head

Specified by:
leftAdjustCharHead in class Encoding

isReverseMatchAllowed

public boolean isReverseMatchAllowed(byte[] bytes,
                                     int p,
                                     int end)
Description copied from class: Encoding
Returns true if it's safe to use the reversal Boyer-Moore search fail-fast algorithm. Oniguruma equivalent: is_allowed_reverse_match

Specified by:
isReverseMatchAllowed in class Encoding

isCodeCTypeInternal

protected final boolean isCodeCTypeInternal(int code,
                                            int ctype)
ONIGENC_IS_XXXXXX_CODE_CTYPE


asciiMbcCaseFold

protected final int asciiMbcCaseFold(int flag,
                                     byte[] bytes,
                                     IntHolder pp,
                                     int end,
                                     byte[] lower)

asciiApplyAllCaseFold

protected final void asciiApplyAllCaseFold(int flag,
                                           ApplyAllCaseFoldFunction fun,
                                           java.lang.Object arg)

asciiCaseFoldCodesByString

protected final CaseFoldCodeItem[] asciiCaseFoldCodesByString(int flag,
                                                              byte[] bytes,
                                                              int p,
                                                              int end)


Copyright © 2008. All Rights Reserved.