mirror of
https://github.com/urbit/shrub.git
synced 2024-12-18 07:42:20 +03:00
389 lines
30 KiB
HTML
389 lines
30 KiB
HTML
|
<html>
|
||
|
<!-- AUTOMATICALLY GENERATED by mksyntaxhtml -->
|
||
|
<head>
|
||
|
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8"/>
|
||
|
<title>RE2 regular expression syntax reference</title>
|
||
|
</head>
|
||
|
<body>
|
||
|
<h1>RE2 regular expression syntax reference</h1>
|
||
|
|
||
|
<table border=0 cellpadding=2 cellspacing=2>
|
||
|
<tr><td colspan=2>This page lists the regular expression syntax accepted by RE2.</td></tr>
|
||
|
<tr><td colspan=2>It also lists syntax accepted by PCRE, PERL, and VIM.</td></tr>
|
||
|
<tr><td colspan=2>Grayed out expressions are not supported by RE2.</td></tr>
|
||
|
<tr><td colspan=2>See <a href="http://go/re2">http://go/re2</a> and <a href="http://go/re2quick">http://go/re2quick</a>.</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Single characters:</b></td></tr>
|
||
|
<tr><td><code>.</code></td><td>any character, including newline (s=true)</td></tr>
|
||
|
<tr><td><code>[xyz]</code></td><td>character class</td></tr>
|
||
|
<tr><td><code>[^xyz]</code></td><td>negated character class</td></tr>
|
||
|
<tr><td><code>\d</code></td><td>Perl character class</td></tr>
|
||
|
<tr><td><code>\D</code></td><td>negated Perl character class</td></tr>
|
||
|
<tr><td><code>[:alpha:]</code></td><td>ASCII character class</td></tr>
|
||
|
<tr><td><code>[:^alpha:]</code></td><td>negated ASCII character class</td></tr>
|
||
|
<tr><td><code>\pN</code></td><td>Unicode character class (one-letter name)</td></tr>
|
||
|
<tr><td><code>\p{Greek}</code></td><td>Unicode character class</td></tr>
|
||
|
<tr><td><code>\PN</code></td><td>negated Unicode character class (one-letter name)</td></tr>
|
||
|
<tr><td><code>\P{Greek}</code></td><td>negated Unicode character class</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Composites:</b></td></tr>
|
||
|
<tr><td><code>xy</code></td><td><code>x</code> followed by <code>y</code></td></tr>
|
||
|
<tr><td><code>x|y</code></td><td><code>x</code> or <code>y</code> (prefer <code>x</code>)</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Repetitions:</b></td></tr>
|
||
|
<tr><td><code>x*</code></td><td>zero or more <code>x</code>, prefer more</td></tr>
|
||
|
<tr><td><code>x+</code></td><td>one or more <code>x</code>, prefer more</td></tr>
|
||
|
<tr><td><code>x?</code></td><td>zero or one <code>x</code>, prefer one</td></tr>
|
||
|
<tr><td><code>x{n,m}</code></td><td><code>n</code> or <code>n</code>+1 or ... or <code>m</code> <code>x</code>, prefer more</td></tr>
|
||
|
<tr><td><code>x{n,}</code></td><td><code>n</code> or more <code>x</code>, prefer more</td></tr>
|
||
|
<tr><td><code>x{n}</code></td><td>exactly <code>n</code> <code>x</code></td></tr>
|
||
|
<tr><td><code>x*?</code></td><td>zero or more <code>x</code>, prefer fewer</td></tr>
|
||
|
<tr><td><code>x+?</code></td><td>one or more <code>x</code>, prefer fewer</td></tr>
|
||
|
<tr><td><code>x??</code></td><td>zero or one <code>x</code>, prefer zero</td></tr>
|
||
|
<tr><td><code>x{n,m}?</code></td><td><code>n</code> or <code>n</code>+1 or ... or <code>m</code> <code>x</code>, prefer fewer</td></tr>
|
||
|
<tr><td><code>x{n,}?</code></td><td><code>n</code> or more <code>x</code>, prefer fewer</td></tr>
|
||
|
<tr><td><code>x{n}?</code></td><td>exactly <code>n</code> <code>x</code></td></tr>
|
||
|
<tr><td><code><font color=#808080>x{}</font></code></td><td>(≡ <code>x*</code>) <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>x{-}</font></code></td><td>(≡ <code>x*?</code>) <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>x{-n}</font></code></td><td>(≡ <code>x{n}?</code>) <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>x=</font></code></td><td>(≡ <code>x?</code>) <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Possessive repetitions:</b></td></tr>
|
||
|
<tr><td><code><font color=#808080>x*+</font></code></td><td>zero or more <code>x</code>, possessive </td></tr>
|
||
|
<tr><td><code><font color=#808080>x++</font></code></td><td>one or more <code>x</code>, possessive </td></tr>
|
||
|
<tr><td><code><font color=#808080>x?+</font></code></td><td>zero or one <code>x</code>, possessive </td></tr>
|
||
|
<tr><td><code><font color=#808080>x{n,m}+</font></code></td><td><code>n</code> or ... or <code>m</code> <code>x</code>, possessive </td></tr>
|
||
|
<tr><td><code><font color=#808080>x{n,}+</font></code></td><td><code>n</code> or more <code>x</code>, possessive </td></tr>
|
||
|
<tr><td><code><font color=#808080>x{n}+</font></code></td><td>exactly <code>n</code> <code>x</code>, possessive </td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Grouping:</b></td></tr>
|
||
|
<tr><td><code>(re)</code></td><td>numbered capturing group</td></tr>
|
||
|
<tr><td><code>(?P<name>re)</code></td><td>named & numbered capturing group</td></tr>
|
||
|
<tr><td><code><font color=#808080>(?<name>re)</font></code></td><td>named & numbered capturing group </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?'name're)</font></code></td><td>named & numbered capturing group </td></tr>
|
||
|
<tr><td><code>(?:re)</code></td><td>non-capturing group</td></tr>
|
||
|
<tr><td><code>(?flags)</code></td><td>set flags until outer paren closes; non-capturing</td></tr>
|
||
|
<tr><td><code>(?flags:re)</code></td><td>set flags during re; non-capturing</td></tr>
|
||
|
<tr><td><code><font color=#808080>(?#text)</font></code></td><td>comment </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?|x|y|z)</font></code></td><td>branch numbering reset </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?>re)</font></code></td><td>possessive match of <code>re</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>re@></font></code></td><td>possessive match of <code>re</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>%(re)</font></code></td><td>non-capturing group <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Flags:</b></td></tr>
|
||
|
<tr><td><code>i</code></td><td>case-insensitive (default false)</td></tr>
|
||
|
<tr><td><code>m</code></td><td>multi-line mode (default false)</td></tr>
|
||
|
<tr><td><code>s</code></td><td>let <code>.</code> match <code>\n</code> (default false)</td></tr>
|
||
|
<tr><td><code>U</code></td><td>ungreedy: swap meaning of <code>x*</code> and <code>x*?</code>, <code>x+</code> and <code>x+?</code>, etc (default false)</td></tr>
|
||
|
<tr><td colspan=2>Flag syntax is <code>xyz</code> (set) or <code>-xyz</code> (clear) or <code>xy-z</code> (set <code>xy</code>, clear <code>z</code>).</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Empty strings:</b></td></tr>
|
||
|
<tr><td><code>^</code></td><td>at beginning of text or line (<code>m</code>=true)</td></tr>
|
||
|
<tr><td><code>$</code></td><td>at end of text or line (<code>m</code>=true)</td></tr>
|
||
|
<tr><td><code>\A</code></td><td>at beginning of text</td></tr>
|
||
|
<tr><td><code>\b</code></td><td>at word boundary (<code>\w</code> to left and <code>\W</code> to right or vice versa)</td></tr>
|
||
|
<tr><td><code>\B</code></td><td>not a word boundary</td></tr>
|
||
|
<tr><td><code><font color=#808080>\G</font></code></td><td>at beginning of subtext being searched <font size=-2>PCRE</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\G</font></code></td><td>at end of last match <font size=-2>PERL</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\Z</font></code></td><td>at end of text, or before newline at end of text </td></tr>
|
||
|
<tr><td><code>\z</code></td><td>at end of text</td></tr>
|
||
|
<tr><td><code><font color=#808080>(?=re)</font></code></td><td>before text matching <code>re</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?!re)</font></code></td><td>before text not matching <code>re</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?<=re)</font></code></td><td>after text matching <code>re</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?<!re)</font></code></td><td>after text not matching <code>re</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>re&</font></code></td><td>before text matching <code>re</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>re@=</font></code></td><td>before text matching <code>re</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>re@!</font></code></td><td>before text not matching <code>re</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>re@<=</font></code></td><td>after text matching <code>re</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>re@<!</font></code></td><td>after text not matching <code>re</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\zs</font></code></td><td>sets start of match (= \K) <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\ze</font></code></td><td>sets end of match <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%^</font></code></td><td>beginning of file <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%$</font></code></td><td>end of file <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%V</font></code></td><td>on screen <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%#</font></code></td><td>cursor position <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%'m</font></code></td><td>mark <code>m</code> position <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%23l</font></code></td><td>in line 23 <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%23c</font></code></td><td>in column 23 <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%23v</font></code></td><td>in virtual column 23 <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Escape sequences:</b></td></tr>
|
||
|
<tr><td><code>\a</code></td><td>bell (≡ <code>\007</code>)</td></tr>
|
||
|
<tr><td><code>\f</code></td><td>form feed (≡ <code>\014</code>)</td></tr>
|
||
|
<tr><td><code>\t</code></td><td>horizontal tab (≡ <code>\011</code>)</td></tr>
|
||
|
<tr><td><code>\n</code></td><td>newline (≡ <code>\012</code>)</td></tr>
|
||
|
<tr><td><code>\r</code></td><td>carriage return (≡ <code>\015</code>)</td></tr>
|
||
|
<tr><td><code>\v</code></td><td>vertical tab character (≡ <code>\013</code>)</td></tr>
|
||
|
<tr><td><code>\*</code></td><td>literal <code>*</code>, for any punctuation character <code>*</code></td></tr>
|
||
|
<tr><td><code>\123</code></td><td>octal character code (up to three digits)</td></tr>
|
||
|
<tr><td><code>\x7F</code></td><td>hex character code (exactly two digits)</td></tr>
|
||
|
<tr><td><code>\x{10FFFF}</code></td><td>hex character code</td></tr>
|
||
|
<tr><td><code>\C</code></td><td>match a single byte even in UTF-8 mode</td></tr>
|
||
|
<tr><td><code>\Q...\E</code></td><td>literal text <code>...</code> even if <code>...</code> has punctuation</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>\1</font></code></td><td>backreference </td></tr>
|
||
|
<tr><td><code><font color=#808080>\b</font></code></td><td>backspace (use <code>\010</code>)</td></tr>
|
||
|
<tr><td><code><font color=#808080>\cK</font></code></td><td>control char ^K (use <code>\001</code> etc)</td></tr>
|
||
|
<tr><td><code><font color=#808080>\e</font></code></td><td>escape (use <code>\033</code>)</td></tr>
|
||
|
<tr><td><code><font color=#808080>\g1</font></code></td><td>backreference </td></tr>
|
||
|
<tr><td><code><font color=#808080>\g{1}</font></code></td><td>backreference </td></tr>
|
||
|
<tr><td><code><font color=#808080>\g{+1}</font></code></td><td>backreference </td></tr>
|
||
|
<tr><td><code><font color=#808080>\g{-1}</font></code></td><td>backreference </td></tr>
|
||
|
<tr><td><code><font color=#808080>\g{name}</font></code></td><td>named backreference </td></tr>
|
||
|
<tr><td><code><font color=#808080>\g<name></font></code></td><td>subroutine call </td></tr>
|
||
|
<tr><td><code><font color=#808080>\g'name'</font></code></td><td>subroutine call </td></tr>
|
||
|
<tr><td><code><font color=#808080>\k<name></font></code></td><td>named backreference </td></tr>
|
||
|
<tr><td><code><font color=#808080>\k'name'</font></code></td><td>named backreference </td></tr>
|
||
|
<tr><td><code><font color=#808080>\lX</font></code></td><td>lowercase <code>X</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>\ux</font></code></td><td>uppercase <code>x</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>\L...\E</font></code></td><td>lowercase text <code>...</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>\K</font></code></td><td>reset beginning of <code>$0</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>\N{name}</font></code></td><td>named Unicode character </td></tr>
|
||
|
<tr><td><code><font color=#808080>\R</font></code></td><td>line break </td></tr>
|
||
|
<tr><td><code><font color=#808080>\U...\E</font></code></td><td>upper case text <code>...</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>\X</font></code></td><td>extended Unicode sequence </td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%d123</font></code></td><td>decimal character 123 <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%xFF</font></code></td><td>hex character FF <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%o123</font></code></td><td>octal character 123 <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%u1234</font></code></td><td>Unicode character 0x1234 <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\%U12345678</font></code></td><td>Unicode character 0x12345678 <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Character class elements:</b></td></tr>
|
||
|
<tr><td><code>x</code></td><td>single character</td></tr>
|
||
|
<tr><td><code>A-Z</code></td><td>character range (inclusive)</td></tr>
|
||
|
<tr><td><code>\d</code></td><td>Perl character class</td></tr>
|
||
|
<tr><td><code>[:foo:]</code></td><td>ASCII character class <code>foo</code></td></tr>
|
||
|
<tr><td><code>\p{Foo}</code></td><td>Unicode character class <code>Foo</code></td></tr>
|
||
|
<tr><td><code>\pF</code></td><td>Unicode character class <code>F</code> (one-letter name)</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Named character classes as character class elements:</b></td></tr>
|
||
|
<tr><td><code>[\d]</code></td><td>digits (≡ <code>\d</code>)</td></tr>
|
||
|
<tr><td><code>[^\d]</code></td><td>not digits (≡ <code>\D</code>)</td></tr>
|
||
|
<tr><td><code>[\D]</code></td><td>not digits (≡ <code>\D</code>)</td></tr>
|
||
|
<tr><td><code>[^\D]</code></td><td>not not digits (≡ <code>\d</code>)</td></tr>
|
||
|
<tr><td><code>[[:name:]]</code></td><td>named ASCII class inside character class (≡ <code>[:name:]</code>)</td></tr>
|
||
|
<tr><td><code>[^[:name:]]</code></td><td>named ASCII class inside negated character class (≡ <code>[:^name:]</code>)</td></tr>
|
||
|
<tr><td><code>[\p{Name}]</code></td><td>named Unicode property inside character class (≡ <code>\p{Name}</code>)</td></tr>
|
||
|
<tr><td><code>[^\p{Name}]</code></td><td>named Unicode property inside negated character class (≡ <code>\P{Name}</code>)</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Perl character classes:</b></td></tr>
|
||
|
<tr><td><code>\d</code></td><td>digits (≡ <code>[0-9]</code>)</td></tr>
|
||
|
<tr><td><code>\D</code></td><td>not digits (≡ <code>[^0-9]</code>)</td></tr>
|
||
|
<tr><td><code>\s</code></td><td>whitespace (≡ <code>[\t\n\f\r ]</code>)</td></tr>
|
||
|
<tr><td><code>\S</code></td><td>not whitespace (≡ <code>[^\t\n\f\r ]</code>)</td></tr>
|
||
|
<tr><td><code>\w</code></td><td>word characters (≡ <code>[0-9A-Za-z_]</code>)</td></tr>
|
||
|
<tr><td><code>\W</code></td><td>not word characters (≡ <code>[^0-9A-Za-z_]</code>)</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>\h</font></code></td><td>horizontal space </td></tr>
|
||
|
<tr><td><code><font color=#808080>\H</font></code></td><td>not horizontal space </td></tr>
|
||
|
<tr><td><code><font color=#808080>\v</font></code></td><td>vertical space </td></tr>
|
||
|
<tr><td><code><font color=#808080>\V</font></code></td><td>not vertical space </td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>ASCII character classes:</b></td></tr>
|
||
|
<tr><td><code>[:alnum:]</code></td><td>alphanumeric (≡ <code>[0-9A-Za-z]</code>)</td></tr>
|
||
|
<tr><td><code>[:alpha:]</code></td><td>alphabetic (≡ <code>[A-Za-z]</code>)</td></tr>
|
||
|
<tr><td><code>[:ascii:]</code></td><td>ASCII (≡ <code>[\x00-\x7F]</code>)</td></tr>
|
||
|
<tr><td><code>[:blank:]</code></td><td>blank (≡ <code>[\t ]</code>)</td></tr>
|
||
|
<tr><td><code>[:cntrl:]</code></td><td>control (≡ <code>[\x00-\x1F\x7F]</code>)</td></tr>
|
||
|
<tr><td><code>[:digit:]</code></td><td>digits (≡ <code>[0-9]</code>)</td></tr>
|
||
|
<tr><td><code>[:graph:]</code></td><td>graphical (≡ <code>[!-~] == [A-Za-z0-9!"#$%&'()*+,\-./:;<=>?@[\\\]^_`{|}~]</code>)</td></tr>
|
||
|
<tr><td><code>[:lower:]</code></td><td>lower case (≡ <code>[a-z]</code>)</td></tr>
|
||
|
<tr><td><code>[:print:]</code></td><td>printable (≡ <code>[ -~] == [ [:graph:]]</code>)</td></tr>
|
||
|
<tr><td><code>[:punct:]</code></td><td>punctuation (≡ <code>[!-/:-@[-`{-~]</code>)</td></tr>
|
||
|
<tr><td><code>[:space:]</code></td><td>whitespace (≡ <code>[\t\n\v\f\r ]</code>)</td></tr>
|
||
|
<tr><td><code>[:upper:]</code></td><td>upper case (≡ <code>[A-Z]</code>)</td></tr>
|
||
|
<tr><td><code>[:word:]</code></td><td>word characters (≡ <code>[0-9A-Za-z_]</code>)</td></tr>
|
||
|
<tr><td><code>[:xdigit:]</code></td><td>hex digit (≡ <code>[0-9A-Fa-f]</code>)</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Unicode character class names--general category:</b></td></tr>
|
||
|
<tr><td><code>C</code></td><td>other</td></tr>
|
||
|
<tr><td><code>Cc</code></td><td>control</td></tr>
|
||
|
<tr><td><code>Cf</code></td><td>format</td></tr>
|
||
|
<tr><td><code><font color=#808080>Cn</font></code></td><td>unassigned code points </td></tr>
|
||
|
<tr><td><code>Co</code></td><td>private use</td></tr>
|
||
|
<tr><td><code>Cs</code></td><td>surrogate</td></tr>
|
||
|
<tr><td><code>L</code></td><td>letter</td></tr>
|
||
|
<tr><td><code><font color=#808080>LC</font></code></td><td>cased letter </td></tr>
|
||
|
<tr><td><code><font color=#808080>L&</font></code></td><td>cased letter </td></tr>
|
||
|
<tr><td><code>Ll</code></td><td>lowercase letter</td></tr>
|
||
|
<tr><td><code>Lm</code></td><td>modifier letter</td></tr>
|
||
|
<tr><td><code>Lo</code></td><td>other letter</td></tr>
|
||
|
<tr><td><code>Lt</code></td><td>titlecase letter</td></tr>
|
||
|
<tr><td><code>Lu</code></td><td>uppercase letter</td></tr>
|
||
|
<tr><td><code>M</code></td><td>mark</td></tr>
|
||
|
<tr><td><code>Mc</code></td><td>spacing mark</td></tr>
|
||
|
<tr><td><code>Me</code></td><td>enclosing mark</td></tr>
|
||
|
<tr><td><code>Mn</code></td><td>non-spacing mark</td></tr>
|
||
|
<tr><td><code>N</code></td><td>number</td></tr>
|
||
|
<tr><td><code>Nd</code></td><td>decimal number</td></tr>
|
||
|
<tr><td><code>Nl</code></td><td>letter number</td></tr>
|
||
|
<tr><td><code>No</code></td><td>other number</td></tr>
|
||
|
<tr><td><code>P</code></td><td>punctuation</td></tr>
|
||
|
<tr><td><code>Pc</code></td><td>connector punctuation</td></tr>
|
||
|
<tr><td><code>Pd</code></td><td>dash punctuation</td></tr>
|
||
|
<tr><td><code>Pe</code></td><td>close punctuation</td></tr>
|
||
|
<tr><td><code>Pf</code></td><td>final punctuation</td></tr>
|
||
|
<tr><td><code>Pi</code></td><td>initial punctuation</td></tr>
|
||
|
<tr><td><code>Po</code></td><td>other punctuation</td></tr>
|
||
|
<tr><td><code>Ps</code></td><td>open punctuation</td></tr>
|
||
|
<tr><td><code>S</code></td><td>symbol</td></tr>
|
||
|
<tr><td><code>Sc</code></td><td>currency symbol</td></tr>
|
||
|
<tr><td><code>Sk</code></td><td>modifier symbol</td></tr>
|
||
|
<tr><td><code>Sm</code></td><td>math symbol</td></tr>
|
||
|
<tr><td><code>So</code></td><td>other symbol</td></tr>
|
||
|
<tr><td><code>Z</code></td><td>separator</td></tr>
|
||
|
<tr><td><code>Zl</code></td><td>line separator</td></tr>
|
||
|
<tr><td><code>Zp</code></td><td>paragraph separator</td></tr>
|
||
|
<tr><td><code>Zs</code></td><td>space separator</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Unicode character class names--scripts:</b></td></tr>
|
||
|
<tr><td><code>Arabic</code></td><td>Arabic</td></tr>
|
||
|
<tr><td><code>Armenian</code></td><td>Armenian</td></tr>
|
||
|
<tr><td><code>Balinese</code></td><td>Balinese</td></tr>
|
||
|
<tr><td><code>Bengali</code></td><td>Bengali</td></tr>
|
||
|
<tr><td><code>Bopomofo</code></td><td>Bopomofo</td></tr>
|
||
|
<tr><td><code>Braille</code></td><td>Braille</td></tr>
|
||
|
<tr><td><code>Buginese</code></td><td>Buginese</td></tr>
|
||
|
<tr><td><code>Buhid</code></td><td>Buhid</td></tr>
|
||
|
<tr><td><code>Canadian_Aboriginal</code></td><td>Canadian Aboriginal</td></tr>
|
||
|
<tr><td><code>Carian</code></td><td>Carian</td></tr>
|
||
|
<tr><td><code>Cham</code></td><td>Cham</td></tr>
|
||
|
<tr><td><code>Cherokee</code></td><td>Cherokee</td></tr>
|
||
|
<tr><td><code>Common</code></td><td>characters not specific to one script</td></tr>
|
||
|
<tr><td><code>Coptic</code></td><td>Coptic</td></tr>
|
||
|
<tr><td><code>Cuneiform</code></td><td>Cuneiform</td></tr>
|
||
|
<tr><td><code>Cypriot</code></td><td>Cypriot</td></tr>
|
||
|
<tr><td><code>Cyrillic</code></td><td>Cyrillic</td></tr>
|
||
|
<tr><td><code>Deseret</code></td><td>Deseret</td></tr>
|
||
|
<tr><td><code>Devanagari</code></td><td>Devanagari</td></tr>
|
||
|
<tr><td><code>Ethiopic</code></td><td>Ethiopic</td></tr>
|
||
|
<tr><td><code>Georgian</code></td><td>Georgian</td></tr>
|
||
|
<tr><td><code>Glagolitic</code></td><td>Glagolitic</td></tr>
|
||
|
<tr><td><code>Gothic</code></td><td>Gothic</td></tr>
|
||
|
<tr><td><code>Greek</code></td><td>Greek</td></tr>
|
||
|
<tr><td><code>Gujarati</code></td><td>Gujarati</td></tr>
|
||
|
<tr><td><code>Gurmukhi</code></td><td>Gurmukhi</td></tr>
|
||
|
<tr><td><code>Han</code></td><td>Han</td></tr>
|
||
|
<tr><td><code>Hangul</code></td><td>Hangul</td></tr>
|
||
|
<tr><td><code>Hanunoo</code></td><td>Hanunoo</td></tr>
|
||
|
<tr><td><code>Hebrew</code></td><td>Hebrew</td></tr>
|
||
|
<tr><td><code>Hiragana</code></td><td>Hiragana</td></tr>
|
||
|
<tr><td><code>Inherited</code></td><td>inherit script from previous character</td></tr>
|
||
|
<tr><td><code>Kannada</code></td><td>Kannada</td></tr>
|
||
|
<tr><td><code>Katakana</code></td><td>Katakana</td></tr>
|
||
|
<tr><td><code>Kayah_Li</code></td><td>Kayah Li</td></tr>
|
||
|
<tr><td><code>Kharoshthi</code></td><td>Kharoshthi</td></tr>
|
||
|
<tr><td><code>Khmer</code></td><td>Khmer</td></tr>
|
||
|
<tr><td><code>Lao</code></td><td>Lao</td></tr>
|
||
|
<tr><td><code>Latin</code></td><td>Latin</td></tr>
|
||
|
<tr><td><code>Lepcha</code></td><td>Lepcha</td></tr>
|
||
|
<tr><td><code>Limbu</code></td><td>Limbu</td></tr>
|
||
|
<tr><td><code>Linear_B</code></td><td>Linear B</td></tr>
|
||
|
<tr><td><code>Lycian</code></td><td>Lycian</td></tr>
|
||
|
<tr><td><code>Lydian</code></td><td>Lydian</td></tr>
|
||
|
<tr><td><code>Malayalam</code></td><td>Malayalam</td></tr>
|
||
|
<tr><td><code>Mongolian</code></td><td>Mongolian</td></tr>
|
||
|
<tr><td><code>Myanmar</code></td><td>Myanmar</td></tr>
|
||
|
<tr><td><code>New_Tai_Lue</code></td><td>New Tai Lue (aka Simplified Tai Lue)</td></tr>
|
||
|
<tr><td><code>Nko</code></td><td>Nko</td></tr>
|
||
|
<tr><td><code>Ogham</code></td><td>Ogham</td></tr>
|
||
|
<tr><td><code>Ol_Chiki</code></td><td>Ol Chiki</td></tr>
|
||
|
<tr><td><code>Old_Italic</code></td><td>Old Italic</td></tr>
|
||
|
<tr><td><code>Old_Persian</code></td><td>Old Persian</td></tr>
|
||
|
<tr><td><code>Oriya</code></td><td>Oriya</td></tr>
|
||
|
<tr><td><code>Osmanya</code></td><td>Osmanya</td></tr>
|
||
|
<tr><td><code>Phags_Pa</code></td><td>'Phags Pa</td></tr>
|
||
|
<tr><td><code>Phoenician</code></td><td>Phoenician</td></tr>
|
||
|
<tr><td><code>Rejang</code></td><td>Rejang</td></tr>
|
||
|
<tr><td><code>Runic</code></td><td>Runic</td></tr>
|
||
|
<tr><td><code>Saurashtra</code></td><td>Saurashtra</td></tr>
|
||
|
<tr><td><code>Shavian</code></td><td>Shavian</td></tr>
|
||
|
<tr><td><code>Sinhala</code></td><td>Sinhala</td></tr>
|
||
|
<tr><td><code>Sundanese</code></td><td>Sundanese</td></tr>
|
||
|
<tr><td><code>Syloti_Nagri</code></td><td>Syloti Nagri</td></tr>
|
||
|
<tr><td><code>Syriac</code></td><td>Syriac</td></tr>
|
||
|
<tr><td><code>Tagalog</code></td><td>Tagalog</td></tr>
|
||
|
<tr><td><code>Tagbanwa</code></td><td>Tagbanwa</td></tr>
|
||
|
<tr><td><code>Tai_Le</code></td><td>Tai Le</td></tr>
|
||
|
<tr><td><code>Tamil</code></td><td>Tamil</td></tr>
|
||
|
<tr><td><code>Telugu</code></td><td>Telugu</td></tr>
|
||
|
<tr><td><code>Thaana</code></td><td>Thaana</td></tr>
|
||
|
<tr><td><code>Thai</code></td><td>Thai</td></tr>
|
||
|
<tr><td><code>Tibetan</code></td><td>Tibetan</td></tr>
|
||
|
<tr><td><code>Tifinagh</code></td><td>Tifinagh</td></tr>
|
||
|
<tr><td><code>Ugaritic</code></td><td>Ugaritic</td></tr>
|
||
|
<tr><td><code>Vai</code></td><td>Vai</td></tr>
|
||
|
<tr><td><code>Yi</code></td><td>Yi</td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Vim character classes:</b></td></tr>
|
||
|
<tr><td><code><font color=#808080>\i</font></code></td><td>identifier character <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\I</font></code></td><td><code>\i</code> except digits <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\k</font></code></td><td>keyword character <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\K</font></code></td><td><code>\k</code> except digits <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\f</font></code></td><td>file name character <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\F</font></code></td><td><code>\f</code> except digits <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\p</font></code></td><td>printable character <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\P</font></code></td><td><code>\p</code> except digits <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\s</font></code></td><td>whitespace character (≡ <code>[ \t]</code>) <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\S</font></code></td><td>non-white space character (≡ <code>[^ \t]</code>) <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code>\d</code></td><td>digits (≡ <code>[0-9]</code>) <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code>\D</code></td><td>not <code>\d</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\x</font></code></td><td>hex digits (≡ <code>[0-9A-Fa-f]</code>) <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\X</font></code></td><td>not <code>\x</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\o</font></code></td><td>octal digits (≡ <code>[0-7]</code>) <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\O</font></code></td><td>not <code>\o</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code>\w</code></td><td>word character <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code>\W</code></td><td>not <code>\w</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\h</font></code></td><td>head of word character <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\H</font></code></td><td>not <code>\h</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\a</font></code></td><td>alphabetic <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\A</font></code></td><td>not <code>\a</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\l</font></code></td><td>lowercase <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\L</font></code></td><td>not lowercase <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\u</font></code></td><td>uppercase <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\U</font></code></td><td>not uppercase <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\_x</font></code></td><td><code>\x</code> plus newline, for any <code>x</code> <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Vim flags:</b></td></tr>
|
||
|
<tr><td><code><font color=#808080>\c</font></code></td><td>ignore case <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\C</font></code></td><td>match case <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\m</font></code></td><td>magic <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\M</font></code></td><td>nomagic <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\v</font></code></td><td>verymagic <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\V</font></code></td><td>verynomagic <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>\Z</font></code></td><td>ignore differences in Unicode combining characters <font size=-2>VIM</font></td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
<tr><td colspan=2><b>Magic:</b></td></tr>
|
||
|
<tr><td><code><font color=#808080>(?{code})</font></code></td><td>arbitrary Perl code <font size=-2>PERL</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>(??{code})</font></code></td><td>postponed arbitrary Perl code <font size=-2>PERL</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>(?n)</font></code></td><td>recursive call to regexp capturing group <code>n</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?+n)</font></code></td><td>recursive call to relative group <code>+n</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?-n)</font></code></td><td>recursive call to relative group <code>-n</code> </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?C)</font></code></td><td>PCRE callout <font size=-2>PCRE</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>(?R)</font></code></td><td>recursive call to entire regexp (≡ <code>(?0)</code>) </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?&name)</font></code></td><td>recursive call to named group </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?P=name)</font></code></td><td>named backreference </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?P>name)</font></code></td><td>recursive call to named group </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?(cond)true|false)</font></code></td><td>conditional branch </td></tr>
|
||
|
<tr><td><code><font color=#808080>(?(cond)true)</font></code></td><td>conditional branch </td></tr>
|
||
|
<tr><td><code><font color=#808080>(*ACCEPT)</font></code></td><td>make regexps more like Prolog </td></tr>
|
||
|
<tr><td><code><font color=#808080>(*COMMIT)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*F)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*FAIL)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*MARK)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*PRUNE)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*SKIP)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*THEN)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*ANY)</font></code></td><td>set newline convention </td></tr>
|
||
|
<tr><td><code><font color=#808080>(*ANYCRLF)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*CR)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*CRLF)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*LF)</font></code></td><td></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*BSR_ANYCRLF)</font></code></td><td>set \R convention <font size=-2>PCRE</font></td></tr>
|
||
|
<tr><td><code><font color=#808080>(*BSR_UNICODE)</font></code></td><td> <font size=-2>PCRE</font></td></tr>
|
||
|
<tr><td></td></tr>
|
||
|
</table>
|
||
|
</body>
|
||
|
</html>
|