Ruby 1.9.3p327(2012-11-10revision37606)
Defines | Enumerations | Functions | Variables
enc/utf_8.c File Reference
#include "regenc.h"
Include dependency graph for utf_8.c:

Go to the source code of this file.

Defines

#define USE_INVALID_CODE_SCHEME
#define INVALID_CODE_FE   0xfffffffe
#define INVALID_CODE_FF   0xffffffff
#define VALID_CODE_LIMIT   0x7fffffff
#define utf8_islead(c)   ((UChar )((c) & 0xc0) != 0x80)
#define A   ACCEPT
#define F   FAILURE
#define UTF8_TRAILS(code, shift)   (UChar )((((code) >> (shift)) & 0x3f) | 0x80)
#define UTF8_TRAIL0(code)   (UChar )(((code) & 0x3f) | 0x80)

Enumerations

enum  state_t {
  FAILURE = -2, ACCEPT = -1, S0 = 0, S1,
  FAILURE = -2, ACCEPT = -1, S0 = 0, S1,
  FAILURE = -2, ACCEPT = -1, S0 = 0, S1,
  S2, S3, S4, S5,
  S6, FAILURE = -2, ACCEPT = -1, S0 = 0,
  S1, S2, FAILURE = -2, ACCEPT = -1,
  S0 = 0, S1, FAILURE = -2, ACCEPT = -1,
  S0 = 0, S1, S2, S3,
  FAILURE = -2, ACCEPT = -1, S0 = 0, S1,
  S2, S3, FAILURE = -2, ACCEPT = -1,
  S0 = 0, S1, FAILURE = -2, ACCEPT = -1,
  S0 = 0, S1, FAILURE = -2, ACCEPT,
  S0, S1, S2, S3,
  S4, S5, S6, S7
}

Functions

static int mbc_enc_len (const UChar *p, const UChar *e, OnigEncoding enc ARG_UNUSED)
static int is_mbc_newline (const UChar *p, const UChar *end, OnigEncoding enc)
static OnigCodePoint mbc_to_code (const UChar *p, const UChar *end, OnigEncoding enc)
static int code_to_mbclen (OnigCodePoint code, OnigEncoding enc ARG_UNUSED)
static int code_to_mbc (OnigCodePoint code, UChar *buf, OnigEncoding enc ARG_UNUSED)
static int mbc_case_fold (OnigCaseFoldType flag, const UChar **pp, const UChar *end, UChar *fold, OnigEncoding enc)
static int get_ctype_code_range (OnigCtype ctype, OnigCodePoint *sb_out, const OnigCodePoint *ranges[], OnigEncoding enc ARG_UNUSED)
static UChar * left_adjust_char_head (const UChar *start, const UChar *s, const UChar *end, OnigEncoding enc ARG_UNUSED)
static int get_case_fold_codes_by_str (OnigCaseFoldType flag, const OnigUChar *p, const OnigUChar *end, OnigCaseFoldCodeItem items[], OnigEncoding enc)
 OnigEncodingDefine (utf_8, UTF_8)

Variables

static const int EncLen_UTF8 []
static const signed char trans [][0x100]

Define Documentation

#define A   ACCEPT

Definition at line 68 of file utf_8.c.

#define F   FAILURE

Definition at line 69 of file utf_8.c.

#define INVALID_CODE_FE   0xfffffffe

Definition at line 36 of file utf_8.c.

Referenced by code_to_mbc(), code_to_mbclen(), and mbc_to_code().

#define INVALID_CODE_FF   0xffffffff

Definition at line 37 of file utf_8.c.

Referenced by code_to_mbc(), code_to_mbclen(), and mbc_to_code().

#define USE_INVALID_CODE_SCHEME

Definition at line 32 of file utf_8.c.

#define utf8_islead (   c)    ((UChar )((c) & 0xc0) != 0x80)

Definition at line 41 of file utf_8.c.

Referenced by left_adjust_char_head().

#define UTF8_TRAIL0 (   code)    (UChar )(((code) & 0x3f) | 0x80)

Referenced by code_to_mbc().

#define UTF8_TRAILS (   code,
  shift 
)    (UChar )((((code) >> (shift)) & 0x3f) | 0x80)

Referenced by code_to_mbc().

#define VALID_CODE_LIMIT   0x7fffffff

Definition at line 38 of file utf_8.c.


Enumeration Type Documentation

enum state_t
Enumerator:
FAILURE 
ACCEPT 
S0 
S1 
FAILURE 
ACCEPT 
S0 
S1 
FAILURE 
ACCEPT 
S0 
S1 
S2 
S3 
S4 
S5 
S6 
FAILURE 
ACCEPT 
S0 
S1 
S2 
FAILURE 
ACCEPT 
S0 
S1 
FAILURE 
ACCEPT 
S0 
S1 
S2 
S3 
FAILURE 
ACCEPT 
S0 
S1 
S2 
S3 
FAILURE 
ACCEPT 
S0 
S1 
FAILURE 
ACCEPT 
S0 
S1 
FAILURE 
ACCEPT 
S0 
S1 
S2 
S3 
S4 
S5 
S6 
S7 

Definition at line 62 of file utf_8.c.


Function Documentation

static int code_to_mbc ( OnigCodePoint  code,
UChar *  buf,
OnigEncoding enc  ARG_UNUSED 
) [static]
static int code_to_mbclen ( OnigCodePoint  code,
OnigEncoding enc  ARG_UNUSED 
) [static]

Definition at line 297 of file utf_8.c.

References INVALID_CODE_FE, INVALID_CODE_FF, and ONIGERR_TOO_BIG_WIDE_CHAR_VALUE.

static int get_case_fold_codes_by_str ( OnigCaseFoldType  flag,
const OnigUChar p,
const OnigUChar end,
OnigCaseFoldCodeItem  items[],
OnigEncoding enc   
) [static]

Definition at line 420 of file utf_8.c.

References onigenc_unicode_get_case_fold_codes_by_str().

static int get_ctype_code_range ( OnigCtype  ctype,
OnigCodePoint sb_out,
const OnigCodePoint ranges[],
OnigEncoding enc  ARG_UNUSED 
) [static]

Definition at line 399 of file utf_8.c.

References onigenc_unicode_ctype_code_range().

static int is_mbc_newline ( const UChar *  p,
const UChar *  end,
OnigEncoding  enc 
) [static]

Definition at line 245 of file utf_8.c.

static UChar* left_adjust_char_head ( const UChar *  start,
const UChar *  s,
const UChar *  end,
OnigEncoding enc  ARG_UNUSED 
) [static]

Definition at line 408 of file utf_8.c.

References UChar, and utf8_islead.

static int mbc_case_fold ( OnigCaseFoldType  flag,
const UChar **  pp,
const UChar *  end,
UChar *  fold,
OnigEncoding  enc 
) [static]
static int mbc_enc_len ( const UChar *  p,
const UChar *  e,
OnigEncoding enc  ARG_UNUSED 
) [static]
static OnigCodePoint mbc_to_code ( const UChar *  p,
const UChar *  end,
OnigEncoding  enc 
) [static]

Definition at line 270 of file utf_8.c.

References enclen, INVALID_CODE_FE, INVALID_CODE_FF, and len.

OnigEncodingDefine ( utf_8  ,
UTF_8   
)

Variable Documentation

const int EncLen_UTF8[] [static]
Initial value:
 {
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
  2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
  2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
  3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
  4, 4, 4, 4, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
}

Definition at line 43 of file utf_8.c.

Referenced by mbc_enc_len().

const signed char trans[][0x100] [static]

Definition at line 70 of file utf_8.c.

Referenced by mbc_enc_len().