File:  [ELWIX - Embedded LightWeight unIX -] / embedaddon / pcre / testdata / testoutput18
Revision 1.1.1.2 (vendor branch): download - view: text, annotated - select for diffs - revision graph
Tue Oct 9 09:19:18 2012 UTC (12 years, 6 months ago) by misho
Branches: pcre, MAIN
CVS tags: v8_31, HEAD
pcre

    1: /-- This set of tests is for UTF-16 support, and is relevant only to the 16-bit
    2:     library. --/
    3: 
    4: /xxx/8?DZSS
    5: **Failed: invalid UTF-8 string cannot be converted to UTF-16
    6: 
    7: /abc/8
    8:     ]
    9: **Failed: invalid UTF-8 string cannot be converted to UTF-16
   10: 
   11: /X(\C{3})/8
   12:     X\x{11234}Y
   13:  0: X\x{11234}Y
   14:  1: \x{11234}Y
   15: 
   16: /X(\C{4})/8
   17:     X\x{11234}YZ
   18:  0: X\x{11234}YZ
   19:  1: \x{11234}YZ
   20: 
   21: /X\C*/8
   22:     XYZabcdce
   23:  0: XYZabcdce
   24: 
   25: /X\C*?/8
   26:     XYZabcde
   27:  0: X
   28: 
   29: /X\C{3,5}/8
   30:     Xabcdefg
   31:  0: Xabcde
   32:     X\x{11234}Y
   33:  0: X\x{11234}Y
   34:     X\x{11234}YZ
   35:  0: X\x{11234}YZ
   36:     X\x{11234}\x{512}
   37:  0: X\x{11234}\x{512}
   38:     X\x{11234}\x{512}YZ
   39:  0: X\x{11234}\x{512}YZ
   40:     X\x{11234}\x{512}\x{11234}Z
   41:  0: X\x{11234}\x{512}\x{11234}
   42: 
   43: /X\C{3,5}?/8
   44:     Xabcdefg
   45:  0: Xabc
   46:     X\x{11234}Y
   47:  0: X\x{11234}Y
   48:     X\x{11234}YZ
   49:  0: X\x{11234}Y
   50:     X\x{11234}\x{512}YZ
   51:  0: X\x{11234}\x{512}
   52:     *** Failers
   53: No match
   54:     X\x{11234}
   55: No match
   56: 
   57: /a\Cb/8
   58:     aXb
   59:  0: aXb
   60:     a\nb
   61:  0: a\x{0a}b
   62: 
   63: /a\C\Cb/8
   64:     a\x{12257}b
   65:  0: a\x{12257}b
   66:     ** Failers
   67: No match
   68:     a\x{100}b
   69: No match
   70: 
   71: /ab\Cde/8
   72:     abXde
   73:  0: abXde
   74: 
   75: /-- Check maximum character size --/
   76: 
   77: /\x{ffff}/8DZ
   78: ------------------------------------------------------------------
   79:         Bra
   80:         \x{ffff}
   81:         Ket
   82:         End
   83: ------------------------------------------------------------------
   84: Capturing subpattern count = 0
   85: Options: utf
   86: First char = \x{ffff}
   87: No need char
   88: 
   89: /\x{10000}/8DZ
   90: ------------------------------------------------------------------
   91:         Bra
   92:         \x{10000}
   93:         Ket
   94:         End
   95: ------------------------------------------------------------------
   96: Capturing subpattern count = 0
   97: Options: utf
   98: First char = \x{d800}
   99: Need char = \x{dc00}
  100: 
  101: /\x{100}/8DZ
  102: ------------------------------------------------------------------
  103:         Bra
  104:         \x{100}
  105:         Ket
  106:         End
  107: ------------------------------------------------------------------
  108: Capturing subpattern count = 0
  109: Options: utf
  110: First char = \x{100}
  111: No need char
  112: 
  113: /\x{1000}/8DZ
  114: ------------------------------------------------------------------
  115:         Bra
  116:         \x{1000}
  117:         Ket
  118:         End
  119: ------------------------------------------------------------------
  120: Capturing subpattern count = 0
  121: Options: utf
  122: First char = \x{1000}
  123: No need char
  124: 
  125: /\x{10000}/8DZ
  126: ------------------------------------------------------------------
  127:         Bra
  128:         \x{10000}
  129:         Ket
  130:         End
  131: ------------------------------------------------------------------
  132: Capturing subpattern count = 0
  133: Options: utf
  134: First char = \x{d800}
  135: Need char = \x{dc00}
  136: 
  137: /\x{100000}/8DZ
  138: ------------------------------------------------------------------
  139:         Bra
  140:         \x{100000}
  141:         Ket
  142:         End
  143: ------------------------------------------------------------------
  144: Capturing subpattern count = 0
  145: Options: utf
  146: First char = \x{dbc0}
  147: Need char = \x{dc00}
  148: 
  149: /\x{10ffff}/8DZ
  150: ------------------------------------------------------------------
  151:         Bra
  152:         \x{10ffff}
  153:         Ket
  154:         End
  155: ------------------------------------------------------------------
  156: Capturing subpattern count = 0
  157: Options: utf
  158: First char = \x{dbff}
  159: Need char = \x{dfff}
  160: 
  161: /[\x{ff}]/8DZ
  162: ------------------------------------------------------------------
  163:         Bra
  164:         \xff
  165:         Ket
  166:         End
  167: ------------------------------------------------------------------
  168: Capturing subpattern count = 0
  169: Options: utf
  170: First char = \x{ff}
  171: No need char
  172: 
  173: /[\x{100}]/8DZ
  174: ------------------------------------------------------------------
  175:         Bra
  176:         \x{100}
  177:         Ket
  178:         End
  179: ------------------------------------------------------------------
  180: Capturing subpattern count = 0
  181: Options: utf
  182: First char = \x{100}
  183: No need char
  184: 
  185: /\x80/8DZ
  186: ------------------------------------------------------------------
  187:         Bra
  188:         \x80
  189:         Ket
  190:         End
  191: ------------------------------------------------------------------
  192: Capturing subpattern count = 0
  193: Options: utf
  194: First char = \x{80}
  195: No need char
  196: 
  197: /\xff/8DZ
  198: ------------------------------------------------------------------
  199:         Bra
  200:         \xff
  201:         Ket
  202:         End
  203: ------------------------------------------------------------------
  204: Capturing subpattern count = 0
  205: Options: utf
  206: First char = \x{ff}
  207: No need char
  208: 
  209: /\x{D55c}\x{ad6d}\x{C5B4}/DZ8
  210: ------------------------------------------------------------------
  211:         Bra
  212:         \x{d55c}\x{ad6d}\x{c5b4}
  213:         Ket
  214:         End
  215: ------------------------------------------------------------------
  216: Capturing subpattern count = 0
  217: Options: utf
  218: First char = \x{d55c}
  219: Need char = \x{c5b4}
  220:     \x{D55c}\x{ad6d}\x{C5B4}
  221:  0: \x{d55c}\x{ad6d}\x{c5b4}
  222: 
  223: /\x{65e5}\x{672c}\x{8a9e}/DZ8
  224: ------------------------------------------------------------------
  225:         Bra
  226:         \x{65e5}\x{672c}\x{8a9e}
  227:         Ket
  228:         End
  229: ------------------------------------------------------------------
  230: Capturing subpattern count = 0
  231: Options: utf
  232: First char = \x{65e5}
  233: Need char = \x{8a9e}
  234:     \x{65e5}\x{672c}\x{8a9e}
  235:  0: \x{65e5}\x{672c}\x{8a9e}
  236: 
  237: /\x{80}/DZ8
  238: ------------------------------------------------------------------
  239:         Bra
  240:         \x80
  241:         Ket
  242:         End
  243: ------------------------------------------------------------------
  244: Capturing subpattern count = 0
  245: Options: utf
  246: First char = \x{80}
  247: No need char
  248: 
  249: /\x{084}/DZ8
  250: ------------------------------------------------------------------
  251:         Bra
  252:         \x84
  253:         Ket
  254:         End
  255: ------------------------------------------------------------------
  256: Capturing subpattern count = 0
  257: Options: utf
  258: First char = \x{84}
  259: No need char
  260: 
  261: /\x{104}/DZ8
  262: ------------------------------------------------------------------
  263:         Bra
  264:         \x{104}
  265:         Ket
  266:         End
  267: ------------------------------------------------------------------
  268: Capturing subpattern count = 0
  269: Options: utf
  270: First char = \x{104}
  271: No need char
  272: 
  273: /\x{861}/DZ8
  274: ------------------------------------------------------------------
  275:         Bra
  276:         \x{861}
  277:         Ket
  278:         End
  279: ------------------------------------------------------------------
  280: Capturing subpattern count = 0
  281: Options: utf
  282: First char = \x{861}
  283: No need char
  284: 
  285: /\x{212ab}/DZ8
  286: ------------------------------------------------------------------
  287:         Bra
  288:         \x{212ab}
  289:         Ket
  290:         End
  291: ------------------------------------------------------------------
  292: Capturing subpattern count = 0
  293: Options: utf
  294: First char = \x{d844}
  295: Need char = \x{deab}
  296: 
  297: /-- This one is here not because it's different to Perl, but because the way
  298: the captured single-byte is displayed. (In Perl it becomes a character, and you
  299: can't tell the difference.) --/
  300: 
  301: /X(\C)(.*)/8
  302:     X\x{1234}
  303:  0: X\x{1234}
  304:  1: \x{1234}
  305:  2: 
  306:     X\nabc
  307:  0: X\x{0a}abc
  308:  1: \x{0a}
  309:  2: abc
  310: 
  311: /-- This one is here because Perl gives out a grumbly error message (quite
  312: correctly, but that messes up comparisons). --/
  313: 
  314: /a\Cb/8
  315:     *** Failers
  316: No match
  317:     a\x{100}b
  318:  0: a\x{100}b
  319: 
  320: /[^ab\xC0-\xF0]/8SDZ
  321: ------------------------------------------------------------------
  322:         Bra
  323:         [\x00-`c-\xbf\xf1-\xff] (neg)
  324:         Ket
  325:         End
  326: ------------------------------------------------------------------
  327: Capturing subpattern count = 0
  328: Options: utf
  329: No first char
  330: No need char
  331: Subject length lower bound = 1
  332: Starting byte set: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x09 \x0a 
  333:   \x0b \x0c \x0d \x0e \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 
  334:   \x1a \x1b \x1c \x1d \x1e \x1f \x20 ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 
  335:   5 6 7 8 9 : ; < = > ? @ A B C D E F G H I J K L M N O P Q R S T U V W X Y 
  336:   Z [ \ ] ^ _ ` c d e f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f 
  337:   \x80 \x81 \x82 \x83 \x84 \x85 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e 
  338:   \x8f \x90 \x91 \x92 \x93 \x94 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d 
  339:   \x9e \x9f \xa0 \xa1 \xa2 \xa3 \xa4 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac 
  340:   \xad \xae \xaf \xb0 \xb1 \xb2 \xb3 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb 
  341:   \xbc \xbd \xbe \xbf \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb 
  342:   \xfc \xfd \xfe \xff 
  343:     \x{f1}
  344:  0: \x{f1}
  345:     \x{bf}
  346:  0: \x{bf}
  347:     \x{100}
  348:  0: \x{100}
  349:     \x{1000}
  350:  0: \x{1000}
  351:     *** Failers
  352:  0: *
  353:     \x{c0}
  354: No match
  355:     \x{f0}
  356: No match
  357: 
  358: /Ā{3,4}/8SDZ
  359: ------------------------------------------------------------------
  360:         Bra
  361:         \x{100}{3}
  362:         \x{100}?
  363:         Ket
  364:         End
  365: ------------------------------------------------------------------
  366: Capturing subpattern count = 0
  367: Options: utf
  368: First char = \x{100}
  369: Need char = \x{100}
  370: Subject length lower bound = 3
  371: No set of starting bytes
  372:   \x{100}\x{100}\x{100}\x{100\x{100}
  373:  0: \x{100}\x{100}\x{100}
  374: 
  375: /(\x{100}+|x)/8SDZ
  376: ------------------------------------------------------------------
  377:         Bra
  378:         CBra 1
  379:         \x{100}+
  380:         Alt
  381:         x
  382:         Ket
  383:         Ket
  384:         End
  385: ------------------------------------------------------------------
  386: Capturing subpattern count = 1
  387: Options: utf
  388: No first char
  389: No need char
  390: Subject length lower bound = 1
  391: Starting byte set: x \xff 
  392: 
  393: /(\x{100}*a|x)/8SDZ
  394: ------------------------------------------------------------------
  395:         Bra
  396:         CBra 1
  397:         \x{100}*+
  398:         a
  399:         Alt
  400:         x
  401:         Ket
  402:         Ket
  403:         End
  404: ------------------------------------------------------------------
  405: Capturing subpattern count = 1
  406: Options: utf
  407: No first char
  408: No need char
  409: Subject length lower bound = 1
  410: Starting byte set: a x \xff 
  411: 
  412: /(\x{100}{0,2}a|x)/8SDZ
  413: ------------------------------------------------------------------
  414:         Bra
  415:         CBra 1
  416:         \x{100}{0,2}
  417:         a
  418:         Alt
  419:         x
  420:         Ket
  421:         Ket
  422:         End
  423: ------------------------------------------------------------------
  424: Capturing subpattern count = 1
  425: Options: utf
  426: No first char
  427: No need char
  428: Subject length lower bound = 1
  429: Starting byte set: a x \xff 
  430: 
  431: /(\x{100}{1,2}a|x)/8SDZ
  432: ------------------------------------------------------------------
  433:         Bra
  434:         CBra 1
  435:         \x{100}
  436:         \x{100}{0,1}
  437:         a
  438:         Alt
  439:         x
  440:         Ket
  441:         Ket
  442:         End
  443: ------------------------------------------------------------------
  444: Capturing subpattern count = 1
  445: Options: utf
  446: No first char
  447: No need char
  448: Subject length lower bound = 1
  449: Starting byte set: x \xff 
  450: 
  451: /\x{100}/8DZ
  452: ------------------------------------------------------------------
  453:         Bra
  454:         \x{100}
  455:         Ket
  456:         End
  457: ------------------------------------------------------------------
  458: Capturing subpattern count = 0
  459: Options: utf
  460: First char = \x{100}
  461: No need char
  462: 
  463: /a\x{100}\x{101}*/8DZ
  464: ------------------------------------------------------------------
  465:         Bra
  466:         a\x{100}
  467:         \x{101}*
  468:         Ket
  469:         End
  470: ------------------------------------------------------------------
  471: Capturing subpattern count = 0
  472: Options: utf
  473: First char = 'a'
  474: Need char = \x{100}
  475: 
  476: /a\x{100}\x{101}+/8DZ
  477: ------------------------------------------------------------------
  478:         Bra
  479:         a\x{100}
  480:         \x{101}+
  481:         Ket
  482:         End
  483: ------------------------------------------------------------------
  484: Capturing subpattern count = 0
  485: Options: utf
  486: First char = 'a'
  487: Need char = \x{101}
  488: 
  489: /[^\x{c4}]/DZ
  490: ------------------------------------------------------------------
  491:         Bra
  492:         [^\xc4]
  493:         Ket
  494:         End
  495: ------------------------------------------------------------------
  496: Capturing subpattern count = 0
  497: No options
  498: No first char
  499: No need char
  500: 
  501: /[\x{100}]/8DZ
  502: ------------------------------------------------------------------
  503:         Bra
  504:         \x{100}
  505:         Ket
  506:         End
  507: ------------------------------------------------------------------
  508: Capturing subpattern count = 0
  509: Options: utf
  510: First char = \x{100}
  511: No need char
  512:     \x{100}
  513:  0: \x{100}
  514:     Z\x{100}
  515:  0: \x{100}
  516:     \x{100}Z
  517:  0: \x{100}
  518:     *** Failers
  519: No match
  520: 
  521: /[\xff]/DZ8
  522: ------------------------------------------------------------------
  523:         Bra
  524:         \xff
  525:         Ket
  526:         End
  527: ------------------------------------------------------------------
  528: Capturing subpattern count = 0
  529: Options: utf
  530: First char = \x{ff}
  531: No need char
  532:     >\x{ff}<
  533:  0: \x{ff}
  534: 
  535: /[^\xff]/8DZ
  536: ------------------------------------------------------------------
  537:         Bra
  538:         [^\xff]
  539:         Ket
  540:         End
  541: ------------------------------------------------------------------
  542: Capturing subpattern count = 0
  543: Options: utf
  544: No first char
  545: No need char
  546: 
  547: /\x{100}abc(xyz(?1))/8DZ
  548: ------------------------------------------------------------------
  549:         Bra
  550:         \x{100}abc
  551:         CBra 1
  552:         xyz
  553:         Recurse
  554:         Ket
  555:         Ket
  556:         End
  557: ------------------------------------------------------------------
  558: Capturing subpattern count = 1
  559: Options: utf
  560: First char = \x{100}
  561: Need char = 'z'
  562: 
  563: /\777/8I
  564: Capturing subpattern count = 0
  565: Options: utf
  566: First char = \x{1ff}
  567: No need char
  568:   \x{1ff}
  569:  0: \x{1ff}
  570:   \777
  571:  0: \x{1ff}
  572: 
  573: /\x{100}+\x{200}/8DZ
  574: ------------------------------------------------------------------
  575:         Bra
  576:         \x{100}++
  577:         \x{200}
  578:         Ket
  579:         End
  580: ------------------------------------------------------------------
  581: Capturing subpattern count = 0
  582: Options: utf
  583: First char = \x{100}
  584: Need char = \x{200}
  585: 
  586: /\x{100}+X/8DZ
  587: ------------------------------------------------------------------
  588:         Bra
  589:         \x{100}++
  590:         X
  591:         Ket
  592:         End
  593: ------------------------------------------------------------------
  594: Capturing subpattern count = 0
  595: Options: utf
  596: First char = \x{100}
  597: Need char = 'X'
  598: 
  599: /^[\QĀ\E-\QŐ\E/BZ8
  600: Failed: missing terminating ] for character class at offset 13
  601: 
  602: /X/8
  603:     \x{0}\x{d7ff}\x{e000}\x{10ffff}
  604: No match
  605:     \x{d800}
  606: Error -10 (bad UTF-16 string) offset=0 reason=1
  607:     \x{d800}\?
  608: No match
  609:     \x{da00}
  610: Error -10 (bad UTF-16 string) offset=0 reason=1
  611:     \x{da00}\?
  612: No match
  613:     \x{dc00}
  614: Error -10 (bad UTF-16 string) offset=0 reason=3
  615:     \x{dc00}\?
  616: No match
  617:     \x{de00}
  618: Error -10 (bad UTF-16 string) offset=0 reason=3
  619:     \x{de00}\?
  620: No match
  621:     \x{dfff}
  622: Error -10 (bad UTF-16 string) offset=0 reason=3
  623:     \x{dfff}\?
  624: No match
  625:     \x{110000}
  626: **Failed: character value greater than 0x10ffff cannot be converted to UTF-16
  627:     \x{d800}\x{1234}
  628: Error -10 (bad UTF-16 string) offset=1 reason=2
  629:     \x{fffe}
  630: Error -10 (bad UTF-16 string) offset=0 reason=4
  631: 
  632: /(*UTF16)\x{11234}/
  633:   abcd\x{11234}pqr
  634:  0: \x{11234}
  635: 
  636: /(*CRLF)(*UTF16)(*BSR_UNICODE)a\Rb/I
  637: Capturing subpattern count = 0
  638: Options: bsr_unicode utf
  639: Forced newline sequence: CRLF
  640: First char = 'a'
  641: Need char = 'b'
  642: 
  643: /\h/SI8
  644: Capturing subpattern count = 0
  645: Options: utf
  646: No first char
  647: No need char
  648: Subject length lower bound = 1
  649: Starting byte set: \x09 \x20 \xa0 \xff 
  650:     ABC\x{09}
  651:  0: \x{09}
  652:     ABC\x{20}
  653:  0:  
  654:     ABC\x{a0}
  655:  0: \x{a0}
  656:     ABC\x{1680}
  657:  0: \x{1680}
  658:     ABC\x{180e}
  659:  0: \x{180e}
  660:     ABC\x{2000}
  661:  0: \x{2000}
  662:     ABC\x{202f}
  663:  0: \x{202f}
  664:     ABC\x{205f}
  665:  0: \x{205f}
  666:     ABC\x{3000}
  667:  0: \x{3000}
  668: 
  669: /\v/SI8
  670: Capturing subpattern count = 0
  671: Options: utf
  672: No first char
  673: No need char
  674: Subject length lower bound = 1
  675: Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff 
  676:     ABC\x{0a}
  677:  0: \x{0a}
  678:     ABC\x{0b}
  679:  0: \x{0b}
  680:     ABC\x{0c}
  681:  0: \x{0c}
  682:     ABC\x{0d}
  683:  0: \x{0d}
  684:     ABC\x{85}
  685:  0: \x{85}
  686:     ABC\x{2028}
  687:  0: \x{2028}
  688: 
  689: /\h*A/SI8
  690: Capturing subpattern count = 0
  691: Options: utf
  692: No first char
  693: Need char = 'A'
  694: Subject length lower bound = 1
  695: Starting byte set: \x09 \x20 A \xa0 \xff 
  696:     CDBABC
  697:  0: A
  698:     \x{2000}ABC 
  699:  0: \x{2000}A
  700: 
  701: /\R*A/SI8
  702: Capturing subpattern count = 0
  703: Options: utf
  704: No first char
  705: Need char = 'A'
  706: Subject length lower bound = 1
  707: Starting byte set: \x0a \x0b \x0c \x0d A \x85 \xff 
  708:     CDBABC
  709:  0: A
  710:     \x{2028}A  
  711:  0: \x{2028}A
  712: 
  713: /\v+A/SI8
  714: Capturing subpattern count = 0
  715: Options: utf
  716: No first char
  717: Need char = 'A'
  718: Subject length lower bound = 2
  719: Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff 
  720: 
  721: /\s?xxx\s/8SI
  722: Capturing subpattern count = 0
  723: Options: utf
  724: No first char
  725: Need char = 'x'
  726: Subject length lower bound = 4
  727: Starting byte set: \x09 \x0a \x0c \x0d \x20 x 
  728: 
  729: /\sxxx\s/I8ST1
  730: Capturing subpattern count = 0
  731: Options: utf
  732: No first char
  733: Need char = 'x'
  734: Subject length lower bound = 5
  735: Starting byte set: \x09 \x0a \x0c \x0d \x20 \x85 \xa0 
  736:     AB\x{85}xxx\x{a0}XYZ
  737:  0: \x{85}xxx\x{a0}
  738:     AB\x{a0}xxx\x{85}XYZ
  739:  0: \x{a0}xxx\x{85}
  740: 
  741: /\S \S/I8ST1
  742: Capturing subpattern count = 0
  743: Options: utf
  744: No first char
  745: Need char = ' '
  746: Subject length lower bound = 3
  747: Starting byte set: \x00 \x01 \x02 \x03 \x04 \x05 \x06 \x07 \x08 \x0b \x0e 
  748:   \x0f \x10 \x11 \x12 \x13 \x14 \x15 \x16 \x17 \x18 \x19 \x1a \x1b \x1c \x1d 
  749:   \x1e \x1f ! " # $ % & ' ( ) * + , - . / 0 1 2 3 4 5 6 7 8 9 : ; < = > ? @ 
  750:   A B C D E F G H I J K L M N O P Q R S T U V W X Y Z [ \ ] ^ _ ` a b c d e 
  751:   f g h i j k l m n o p q r s t u v w x y z { | } ~ \x7f \x80 \x81 \x82 \x83 
  752:   \x84 \x86 \x87 \x88 \x89 \x8a \x8b \x8c \x8d \x8e \x8f \x90 \x91 \x92 \x93 
  753:   \x94 \x95 \x96 \x97 \x98 \x99 \x9a \x9b \x9c \x9d \x9e \x9f \xa1 \xa2 \xa3 
  754:   \xa4 \xa5 \xa6 \xa7 \xa8 \xa9 \xaa \xab \xac \xad \xae \xaf \xb0 \xb1 \xb2 
  755:   \xb3 \xb4 \xb5 \xb6 \xb7 \xb8 \xb9 \xba \xbb \xbc \xbd \xbe \xbf \xc0 \xc1 
  756:   \xc2 \xc3 \xc4 \xc5 \xc6 \xc7 \xc8 \xc9 \xca \xcb \xcc \xcd \xce \xcf \xd0 
  757:   \xd1 \xd2 \xd3 \xd4 \xd5 \xd6 \xd7 \xd8 \xd9 \xda \xdb \xdc \xdd \xde \xdf 
  758:   \xe0 \xe1 \xe2 \xe3 \xe4 \xe5 \xe6 \xe7 \xe8 \xe9 \xea \xeb \xec \xed \xee 
  759:   \xef \xf0 \xf1 \xf2 \xf3 \xf4 \xf5 \xf6 \xf7 \xf8 \xf9 \xfa \xfb \xfc \xfd 
  760:   \xfe \xff 
  761:     \x{a2} \x{84}
  762:  0: \x{a2} \x{84}
  763:     A Z
  764:  0: A Z
  765: 
  766: /a+/8
  767:     a\x{123}aa\>1
  768:  0: aa
  769:     a\x{123}aa\>2
  770:  0: aa
  771:     a\x{123}aa\>3
  772:  0: a
  773:     a\x{123}aa\>4
  774: No match
  775:     a\x{123}aa\>5
  776: Error -24 (bad offset value)
  777:     a\x{123}aa\>6
  778: Error -24 (bad offset value)
  779: 
  780: /\x{1234}+/iS8I
  781: Capturing subpattern count = 0
  782: Options: caseless utf
  783: First char = \x{1234}
  784: No need char
  785: Subject length lower bound = 1
  786: No set of starting bytes
  787: 
  788: /\x{1234}+?/iS8I
  789: Capturing subpattern count = 0
  790: Options: caseless utf
  791: First char = \x{1234}
  792: No need char
  793: Subject length lower bound = 1
  794: No set of starting bytes
  795: 
  796: /\x{1234}++/iS8I
  797: Capturing subpattern count = 0
  798: Options: caseless utf
  799: First char = \x{1234}
  800: No need char
  801: Subject length lower bound = 1
  802: No set of starting bytes
  803: 
  804: /\x{1234}{2}/iS8I
  805: Capturing subpattern count = 0
  806: Options: caseless utf
  807: First char = \x{1234}
  808: Need char = \x{1234}
  809: Subject length lower bound = 2
  810: No set of starting bytes
  811: 
  812: /[^\x{c4}]/8DZ
  813: ------------------------------------------------------------------
  814:         Bra
  815:         [^\xc4]
  816:         Ket
  817:         End
  818: ------------------------------------------------------------------
  819: Capturing subpattern count = 0
  820: Options: utf
  821: No first char
  822: No need char
  823: 
  824: /X+\x{200}/8DZ
  825: ------------------------------------------------------------------
  826:         Bra
  827:         X++
  828:         \x{200}
  829:         Ket
  830:         End
  831: ------------------------------------------------------------------
  832: Capturing subpattern count = 0
  833: Options: utf
  834: First char = 'X'
  835: Need char = \x{200}
  836: 
  837: /\R/SI8
  838: Capturing subpattern count = 0
  839: Options: utf
  840: No first char
  841: No need char
  842: Subject length lower bound = 1
  843: Starting byte set: \x0a \x0b \x0c \x0d \x85 \xff 
  844: 
  845: /-- Check bad offset --/
  846: 
  847: /a/8
  848:     \x{10000}\>1
  849: Error -11 (bad UTF-16 offset)
  850:     \x{10000}ab\>2
  851:  0: a
  852:     \x{10000}ab\>3
  853: No match
  854:     \x{10000}ab\>4
  855: No match
  856:     \x{10000}ab\>5
  857: Error -24 (bad offset value)
  858: 
  859: //8
  860: Failed: invalid UTF-16 string at offset 0
  861: 
  862: /\w+\x{C4}/8BZ
  863: ------------------------------------------------------------------
  864:         Bra
  865:         \w++
  866:         \xc4
  867:         Ket
  868:         End
  869: ------------------------------------------------------------------
  870:     a\x{C4}\x{C4}
  871:  0: a\x{c4}
  872: 
  873: /\w+\x{C4}/8BZT1
  874: ------------------------------------------------------------------
  875:         Bra
  876:         \w+
  877:         \xc4
  878:         Ket
  879:         End
  880: ------------------------------------------------------------------
  881:     a\x{C4}\x{C4}
  882:  0: a\x{c4}\x{c4}
  883:     
  884: /\W+\x{C4}/8BZ
  885: ------------------------------------------------------------------
  886:         Bra
  887:         \W+
  888:         \xc4
  889:         Ket
  890:         End
  891: ------------------------------------------------------------------
  892:     !\x{C4}
  893:  0: !\x{c4}
  894:  
  895: /\W+\x{C4}/8BZT1
  896: ------------------------------------------------------------------
  897:         Bra
  898:         \W++
  899:         \xc4
  900:         Ket
  901:         End
  902: ------------------------------------------------------------------
  903:     !\x{C4}
  904:  0: !\x{c4}
  905: 
  906: /\W+\x{A1}/8BZ
  907: ------------------------------------------------------------------
  908:         Bra
  909:         \W+
  910:         \xa1
  911:         Ket
  912:         End
  913: ------------------------------------------------------------------
  914:     !\x{A1}
  915:  0: !\x{a1}
  916:  
  917: /\W+\x{A1}/8BZT1
  918: ------------------------------------------------------------------
  919:         Bra
  920:         \W+
  921:         \xa1
  922:         Ket
  923:         End
  924: ------------------------------------------------------------------
  925:     !\x{A1}
  926:  0: !\x{a1}
  927: 
  928: /X\s+\x{A0}/8BZ
  929: ------------------------------------------------------------------
  930:         Bra
  931:         X
  932:         \s++
  933:         \xa0
  934:         Ket
  935:         End
  936: ------------------------------------------------------------------
  937:     X\x20\x{A0}\x{A0}
  938:  0: X \x{a0}
  939: 
  940: /X\s+\x{A0}/8BZT1
  941: ------------------------------------------------------------------
  942:         Bra
  943:         X
  944:         \s+
  945:         \xa0
  946:         Ket
  947:         End
  948: ------------------------------------------------------------------
  949:     X\x20\x{A0}\x{A0}
  950:  0: X \x{a0}\x{a0}
  951: 
  952: /\S+\x{A0}/8BZ
  953: ------------------------------------------------------------------
  954:         Bra
  955:         \S+
  956:         \xa0
  957:         Ket
  958:         End
  959: ------------------------------------------------------------------
  960:     X\x{A0}\x{A0}
  961:  0: X\x{a0}\x{a0}
  962: 
  963: /\S+\x{A0}/8BZT1
  964: ------------------------------------------------------------------
  965:         Bra
  966:         \S++
  967:         \xa0
  968:         Ket
  969:         End
  970: ------------------------------------------------------------------
  971:     X\x{A0}\x{A0}
  972:  0: X\x{a0}
  973: 
  974: /\x{a0}+\s!/8BZ
  975: ------------------------------------------------------------------
  976:         Bra
  977:         \xa0++
  978:         \s
  979:         !
  980:         Ket
  981:         End
  982: ------------------------------------------------------------------
  983:     \x{a0}\x20!
  984:  0: \x{a0} !
  985: 
  986: /\x{a0}+\s!/8BZT1
  987: ------------------------------------------------------------------
  988:         Bra
  989:         \xa0+
  990:         \s
  991:         !
  992:         Ket
  993:         End
  994: ------------------------------------------------------------------
  995:     \x{a0}\x20!
  996:  0: \x{a0} !
  997: 
  998: /-- End of testinput18 --/

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>