Class MultiByteEncoding
java.lang.Object
org.graalvm.shadowed.org.jcodings.Encoding
org.graalvm.shadowed.org.jcodings.MultiByteEncoding
- All Implemented Interfaces:
Cloneable
- Direct Known Subclasses:
CanBeTrailTableEncoding, EmacsMuleEncoding, EucEncoding, GB18030Encoding, UnicodeEncoding
-
Field Summary
Fields (Modifier and Type | Field | Description):
protected static final int A
protected final int[] EncLen
protected static final int F
protected final int[][] Trans
protected final int[] TransZero
-
Constructor Summary
Constructors (Modifier | Constructor | Description):
protected MultiByteEncoding(String name, int minLength, int maxLength, int[] EncLen, int[][] Trans, short[] CTypeTable)
-
Method Summary
Modifier and Type | Method | Description
void applyAllCaseFold(int flag, ApplyAllCaseFoldFunction fun, Object arg): onigenc_ascii_apply_all_case_fold / also used by multibyte encodings
protected final void asciiApplyAllCaseFold(int flag, ApplyAllCaseFoldFunction fun, Object arg)
protected final CaseFoldCodeItem[] asciiCaseFoldCodesByString(int flag, byte[] bytes, int p, int end)
protected final int asciiMbcCaseFold(int flag, byte[] bytes, IntHolder pp, int end, byte[] lower)
caseFoldCodesByString(int flag, byte[] bytes, int p, int end): onigenc_ascii_get_case_fold_codes_by_str / also used by multibyte encodings
int caseMap(IntHolder flagP, byte[] bytes, IntHolder pp, int end, byte[] to, int toP, int toEnd): Oniguruma equivalent: case_map
protected final boolean isCodeCTypeInternal(int code, int ctype): ONIGENC_IS_XXXXXX_CODE_CTYPE
static boolean isInRange(int code, int from, int to)
boolean isNewLine(byte[] bytes, int p, int end): onigenc_is_mbc_newline_0x0a / also used by multibyte encodings
int length(byte c): Returns the character length given the character head: returns 1 for single-byte encodings, or performs a direct length-table lookup for multibyte ones.
protected final int lengthForTwoUptoFour(byte[] bytes, int p, int end, int b, int s)
protected final int mb2CodeToMbc(int code, byte[] bytes, int p)
protected final int mb2CodeToMbcLength(int code)
protected final boolean mb2IsCodeCType(int code, int ctype)
protected final int mb4CodeToMbc(int code, byte[] bytes, int p)
protected final int mb4CodeToMbcLength(int code)
protected final boolean mb4IsCodeCType(int code, int ctype)
int mbcCaseFold(int flag, byte[] bytes, IntHolder pp, int end, byte[] lower): onigenc_ascii_mbc_case_fold
protected final int mbnMbcCaseFold(int flag, byte[] bytes, IntHolder pp, int end, byte[] lower)
protected final int mbnMbcToCode(byte[] bytes, int p, int end)
protected final int missing(int n)
protected final int missing(int b, int delta)
int propertyNameToCType(byte[] bytes, int p, int end): onigenc_minimum_property_name_to_ctype; notably overridden by Unicode encodings
protected final int safeLengthForUptoFour(byte[] bytes, int p, int end)
protected final int safeLengthForUptoThree(byte[] bytes, int p, int end)
protected final int safeLengthForUptoTwo(byte[] bytes, int p, int end)
int strCodeAt(byte[] bytes, int p, int end, int index)
int strLength(byte[] bytes, int p, int end)
Methods inherited from class org.graalvm.shadowed.org.jcodings.Encoding
asciiToLower, asciiToUpper, codeToMbc, codeToMbcLength, ctypeCodeRange, digitVal, equals, getCharset, getCharsetName, getIndex, getName, hashCode, isAlnum, isAlpha, isAscii, isAscii, isAsciiCompatible, isBlank, isCntrl, isCodeCType, isDigit, isDummy, isFixedWidth, isGraph, isLower, isMbcAscii, isMbcCrnl, isMbcHead, isMbcWord, isNewLine, isPrint, isPunct, isReverseMatchAllowed, isSbWord, isSingleByte, isSpace, isUnicode, isUpper, isUTF8, isWord, isWordGraphPrint, isXDigit, leftAdjustCharHead, length, load, load, maxLength, maxLengthDistance, mbcodeStartPosition, mbcToCode, minLength, odigitVal, prevCharHead, rightAdjustCharHead, rightAdjustCharHeadWithPrev, setDummy, setName, setName, step, stepBack, strByteLengthNull, strLengthNull, strNCmp, toLowerCaseTable, toString, xdigitVal
-
Field Details
-
EncLen
protected final int[] EncLen -
A
protected static final int A - See Also:
-
F
protected static final int F - See Also:
-
Trans
protected final int[][] Trans -
TransZero
protected final int[] TransZero
-
-
Constructor Details
-
MultiByteEncoding
protected MultiByteEncoding(String name, int minLength, int maxLength, int[] EncLen, int[][] Trans, short[] CTypeTable)
-
-
Method Details
-
length
public int length(byte c) Description copied from class: Encoding. Returns the character length given the character head: returns 1 for single-byte encodings, or performs a direct length-table lookup for multibyte ones. -
missing
protected final int missing(int n) -
missing
protected final int missing(int b, int delta) -
safeLengthForUptoFour
protected final int safeLengthForUptoFour(byte[] bytes, int p, int end) -
lengthForTwoUptoFour
protected final int lengthForTwoUptoFour(byte[] bytes, int p, int end, int b, int s) -
safeLengthForUptoThree
protected final int safeLengthForUptoThree(byte[] bytes, int p, int end) -
safeLengthForUptoTwo
protected final int safeLengthForUptoTwo(byte[] bytes, int p, int end) -
mbnMbcToCode
protected final int mbnMbcToCode(byte[] bytes, int p, int end) -
caseMap
public int caseMap(IntHolder flagP, byte[] bytes, IntHolder pp, int end, byte[] to, int toP, int toEnd) Description copied from class: Encoding. Oniguruma equivalent: case_map -
mbnMbcCaseFold
protected final int mbnMbcCaseFold(int flag, byte[] bytes, IntHolder pp, int end, byte[] lower) -
mb2CodeToMbcLength
protected final int mb2CodeToMbcLength(int code) -
mb4CodeToMbcLength
protected final int mb4CodeToMbcLength(int code) -
mb2CodeToMbc
protected final int mb2CodeToMbc(int code, byte[] bytes, int p) -
mb4CodeToMbc
protected final int mb4CodeToMbc(int code, byte[] bytes, int p) -
mb2IsCodeCType
protected final boolean mb2IsCodeCType(int code, int ctype) -
mb4IsCodeCType
protected final boolean mb4IsCodeCType(int code, int ctype) -
strLength
public int strLength(byte[] bytes, int p, int end) -
strCodeAt
public int strCodeAt(byte[] bytes, int p, int end, int index) -
isInRange
public static boolean isInRange(int code, int from, int to) -
isCodeCTypeInternal
protected final boolean isCodeCTypeInternal(int code, int ctype) ONIGENC_IS_XXXXXX_CODE_CTYPE -
isNewLine
public boolean isNewLine(byte[] bytes, int p, int end) onigenc_is_mbc_newline_0x0a / used also by multibyte encodings -
asciiMbcCaseFold
protected final int asciiMbcCaseFold(int flag, byte[] bytes, IntHolder pp, int end, byte[] lower) -
mbcCaseFold
public int mbcCaseFold(int flag, byte[] bytes, IntHolder pp, int end, byte[] lower)
onigenc_ascii_mbc_case_fold
- Specified by: mbcCaseFold in class Encoding
- Parameters:
flag - case fold flag
pp - an IntHolder that points at the character head
lower - a buffer into which the case-folded character is extracted
Oniguruma equivalent: mbc_case_fold
-
asciiApplyAllCaseFold
protected final void asciiApplyAllCaseFold(int flag, ApplyAllCaseFoldFunction fun, Object arg) -
applyAllCaseFold
public void applyAllCaseFold(int flag, ApplyAllCaseFoldFunction fun, Object arg)
onigenc_ascii_apply_all_case_fold / also used by multibyte encodings
- Specified by: applyAllCaseFold in class Encoding
- Parameters:
flag - case fold flag
fun - case folding functor (see ApplyCaseFold)
arg - case folding functor argument (see ApplyCaseFoldArg)
Oniguruma equivalent: apply_all_case_fold
-
asciiCaseFoldCodesByString
protected final CaseFoldCodeItem[] asciiCaseFoldCodesByString(int flag, byte[] bytes, int p, int end) -
caseFoldCodesByString
onigenc_ascii_get_case_fold_codes_by_str / also used by multibyte encodings
- Specified by: caseFoldCodesByString in class Encoding
-
propertyNameToCType
public int propertyNameToCType(byte[] bytes, int p, int end) onigenc_minimum_property_name_to_ctype; notably overridden by Unicode encodings
- Specified by: propertyNameToCType in class Encoding
-