Ignore:
Timestamp:
Jun 9, 2016, 3:34:07 PM (3 years ago)
Author:
xuedongx
Message:

Support for the UTF-16 representation of Unicode

File:
1 edited

Legend:

Unmodified
Added
Removed
  • icGREP/icgrep-devel/icgrep/re/re_compiler.h

    r5042 r5045  
    2323/*   Marker streams represent the results of matching steps.
    2424     Three types of marker streams are used internally.
    25      FinalMatchByte markers are used for character classes and
     25     FinalMatchUnit markers are used for character classes and
    2626     other strings identified by a one bit at their final position.
    27      InitialPostPositionByte markers are used to mark matches with
    28      a 1 bit immediately after a match.   InitialPostPositionByte markers
     27     InitialPostPositionUnit markers are used to mark matches with
     28     a 1 bit immediately after a match.   InitialPostPositionUnit markers
    2929     are generally required whenever a regular expression element
    3030     can match the empty string (e.g., * and ? repeated items).
    31      FinalPostPositionByte markers are used for single code unit
     31     FinalPostPositionUnit markers are used for single code unit
    3232     lookahead assertions. 
    3333*/
     
    3535namespace re {
    3636
    37 enum MarkerPosition {FinalMatchByte, InitialPostPositionByte, FinalPostPositionByte};
     37enum MarkerPosition {FinalMatchUnit, InitialPostPositionUnit, FinalPostPositionUnit};
    3838
    3939struct MarkerType {
     
    5353
    5454    RE_Compiler(pablo::PabloFunction & function, cc::CC_Compiler & ccCompiler);
    55     void initializeRequiredStreams();
     55    void initializeRequiredStreams(Encoding encoding);
    5656    void compileUnicodeNames(RE *& re);
    5757    void finalizeMatchResult(MarkerType match_result, bool InvertMatches = false);
     
    6262private:
    6363
     64    void initializeRequiredStreams_utf8();
     65    void initializeRequiredStreams_utf16();
    6466    MarkerType compile(RE * re, pablo::PabloBuilder & cg);
    6567
Note: See TracChangeset for help on using the changeset viewer.