1 | <!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0 Transitional//EN"> |
---|
2 | <html> |
---|
3 | <head> |
---|
4 | <title>Boost.Regex: Character Class Names</title> |
---|
5 | <meta http-equiv="Content-Type" content="text/html; charset=iso-8859-1"> |
---|
6 | <link rel="stylesheet" type="text/css" href="../../../boost.css"> |
---|
7 | </head> |
---|
8 | <body> |
---|
9 | <P> |
---|
10 | <TABLE id="Table1" cellSpacing="1" cellPadding="1" width="100%" border="0"> |
---|
11 | <TR> |
---|
12 | <td valign="top" width="300"> |
---|
13 | <h3><a href="../../../index.htm"><img height="86" width="277" alt="C++ Boost" src="../../../boost.png" border="0"></a></h3> |
---|
14 | </td> |
---|
15 | <TD width="353"> |
---|
16 | <H1 align="center">Boost.Regex</H1> |
---|
17 | <H2 align="center">Character Class Names.</H2> |
---|
18 | </TD> |
---|
19 | <td width="50"> |
---|
20 | <h3><a href="index.html"><img height="45" width="43" alt="Boost.Regex Index" src="uarrow.gif" border="0"></a></h3> |
---|
21 | </td> |
---|
22 | </TR> |
---|
23 | </TABLE> |
---|
24 | </P> |
---|
25 | <HR> |
---|
26 | <p></p> |
---|
27 | <H3>Contents</H3> |
---|
28 | <dl class="index"> |
---|
29 | <dt><a href="#always">Character Classes that are Always Supported</a></dt> <dt><a href="#unicode"> |
---|
30 | Character classes that are supported by Unicode Regular Expressions</a></dt> |
---|
31 | </dl> |
---|
32 | <H3><A name="always"></A>Character Classes that are Always Supported</H3> |
---|
33 | <P>The following character class names are always supported by Boost.Regex:</P> |
---|
34 | <P> |
---|
35 | <TABLE id="Table2" cellSpacing="1" cellPadding="1" width="100%" border="1"> |
---|
36 | <TR> |
---|
37 | <TD><STRONG>Name</STRONG></TD> |
---|
38 | <TD><STRONG>POSIX-standard name</STRONG></TD> |
---|
39 | <TD><STRONG>Description</STRONG></TD> |
---|
40 | </TR> |
---|
41 | <TR> |
---|
42 | <TD>alnum</TD> |
---|
43 | <TD>Yes</TD> |
---|
44 | <TD>Any alpha-numeric character.</TD> |
---|
45 | </TR> |
---|
46 | <TR> |
---|
47 | <TD>alpha</TD> |
---|
48 | <TD>Yes</TD> |
---|
49 | <TD>Any alphabetic character.</TD> |
---|
50 | </TR> |
---|
51 | <TR> |
---|
52 | <TD>blank</TD> |
---|
53 | <TD>Yes</TD> |
---|
54 | <TD>Any whitespace character that is not a line separator.</TD> |
---|
55 | </TR> |
---|
56 | <TR> |
---|
57 | <TD>cntrl</TD> |
---|
58 | <TD>Yes</TD> |
---|
59 | <TD>Any control character.</TD> |
---|
60 | </TR> |
---|
61 | <TR> |
---|
62 | <TD>d</TD> |
---|
63 | <TD>No</TD> |
---|
64 | <TD>Any decimal digit.</TD> |
---|
65 | </TR> |
---|
66 | <TR> |
---|
67 | <TD>digit</TD> |
---|
68 | <TD>Yes</TD> |
---|
69 | <TD>Any decimal digit.</TD> |
---|
70 | </TR> |
---|
71 | <TR> |
---|
72 | <TD>graph</TD> |
---|
73 | <TD>Yes</TD> |
---|
74 | <TD>Any graphical character.</TD> |
---|
75 | </TR> |
---|
76 | <TR> |
---|
77 | <TD>l</TD> |
---|
78 | <TD>No</TD> |
---|
79 | <TD>Any lower case character.</TD> |
---|
80 | </TR> |
---|
81 | <TR> |
---|
82 | <TD>lower</TD> |
---|
83 | <TD>Yes</TD> |
---|
84 | <TD>Any lower case character.</TD> |
---|
85 | </TR> |
---|
86 | <TR> |
---|
87 | <TD>print</TD> |
---|
88 | <TD>Yes</TD> |
---|
89 | <TD>Any printable character.</TD> |
---|
90 | </TR> |
---|
91 | <TR> |
---|
92 | <TD>punct</TD> |
---|
93 | <TD>Yes</TD> |
---|
94 | <TD>Any punctuation character.</TD> |
---|
95 | </TR> |
---|
96 | <TR> |
---|
97 | <TD>s</TD> |
---|
98 | <TD>No</TD> |
---|
99 | <TD>Any whitespace character.</TD> |
---|
100 | </TR> |
---|
101 | <TR> |
---|
102 | <TD>space</TD> |
---|
103 | <TD>Yes</TD> |
---|
104 | <TD>Any whitespace character.</TD> |
---|
105 | </TR> |
---|
106 | <TR> |
---|
107 | <TD>unicode</TD> |
---|
108 | <TD>No</TD> |
---|
109 | <TD>Any extended character whose code point is above 255 in value.</TD> |
---|
110 | </TR> |
---|
111 | <TR> |
---|
112 | <TD>u</TD> |
---|
113 | <TD>No</TD> |
---|
114 | <TD>Any upper case character.</TD> |
---|
115 | </TR> |
---|
116 | <TR> |
---|
117 | <TD>upper</TD> |
---|
118 | <TD>Yes</TD> |
---|
119 | <TD>Any upper case character.</TD> |
---|
120 | </TR> |
---|
121 | <TR> |
---|
122 | <TD>w</TD> |
---|
123 | <TD>No</TD> |
---|
124 | <TD>Any word character (alphanumeric characters plus the underscore).</TD> |
---|
125 | </TR> |
---|
126 | <TR> |
---|
127 | <TD>word</TD> |
---|
128 | <TD>No</TD> |
---|
129 | <TD>Any word character (alphanumeric characters plus the underscore).</TD> |
---|
130 | </TR> |
---|
131 | <TR> |
---|
132 | <TD>xdigit</TD> |
---|
133 | <TD>Yes</TD> |
---|
134 | <TD>Any hexadecimal digit character.</TD> |
---|
135 | </TR> |
---|
136 | </TABLE> |
---|
137 | </P> |
---|
138 | <P> |
---|
139 | <H3><A name="unicode"></A>Character classes that are supported by Unicode Regular |
---|
140 | Expressions</H3> |
---|
141 | <P>The following character classes are only supported by <A href="icu_strings.html">Unicode |
---|
142 | Regular Expressions</A>: that is, those that use the u32regex type. The |
---|
143 | names used are the same as those from <A href="http://www.unicode.org/versions/Unicode4.0.0/ch04.pdf#G124142"> |
---|
144 | Chapter 4 of the Unicode standard</A>.</P> |
---|
145 | <table width="100%" ID="Table3"> |
---|
146 | <tr> |
---|
147 | <td><b>Short Name</b></td> |
---|
148 | <td><b>Long Name</b></td> |
---|
149 | </tr> |
---|
150 | <tr> |
---|
151 | <td> |
---|
152 | </td> |
---|
153 | <td>ASCII</td> |
---|
154 | </tr> |
---|
155 | <tr> |
---|
156 | <td> |
---|
157 | </td> |
---|
158 | <td>Any</td> |
---|
159 | </tr> |
---|
160 | <tr> |
---|
161 | <td> |
---|
162 | </td> |
---|
163 | <td>Assigned</td> |
---|
164 | </tr> |
---|
165 | <tr> |
---|
166 | <td>C*</td> |
---|
167 | <td>Other</td> |
---|
168 | </tr> |
---|
169 | <tr> |
---|
170 | <td>Cc</td> |
---|
171 | <td>Control</td> |
---|
172 | </tr> |
---|
173 | <tr> |
---|
174 | <td>Cf</td> |
---|
175 | <td>Format</td> |
---|
176 | </tr> |
---|
177 | <tr> |
---|
178 | <td>Cn</td> |
---|
179 | <td>Not Assigned</td> |
---|
180 | </tr> |
---|
181 | <tr> |
---|
182 | <td>Co</td> |
---|
183 | <td>Private Use</td> |
---|
184 | </tr> |
---|
185 | <tr> |
---|
186 | <td>Cs</td> |
---|
187 | <td>Surrogate</td> |
---|
188 | </tr> |
---|
189 | <tr> |
---|
190 | <td>L*</td> |
---|
191 | <td>Letter</td> |
---|
192 | </tr> |
---|
193 | <tr> |
---|
194 | <td>Ll</td> |
---|
195 | <td>Lowercase Letter</td> |
---|
196 | </tr> |
---|
197 | <tr> |
---|
198 | <td>Lm</td> |
---|
199 | <td>Modifier Letter</td> |
---|
200 | </tr> |
---|
201 | <tr> |
---|
202 | <td>Lo</td> |
---|
203 | <td>Other Letter</td> |
---|
204 | </tr> |
---|
205 | <tr> |
---|
206 | <td>Lt</td> |
---|
207 | <td>Titlecase</td> |
---|
208 | </tr> |
---|
209 | <tr> |
---|
210 | <td>Lu</td> |
---|
211 | <td>Uppercase Letter</td> |
---|
212 | </tr> |
---|
213 | <tr> |
---|
214 | <td>M*</td> |
---|
215 | <td>Mark</td> |
---|
216 | </tr> |
---|
217 | <tr> |
---|
218 | <td>Mc</td> |
---|
219 | <td>Spacing Combining Mark</td> |
---|
220 | </tr> |
---|
221 | <tr> |
---|
222 | <td>Me</td> |
---|
223 | <td>Enclosing Mark</td> |
---|
224 | </tr> |
---|
225 | <tr> |
---|
226 | <td>Mn</td> |
---|
227 | <td>Non-Spacing Mark</td> |
---|
228 | </tr> |
---|
229 | <tr> |
---|
230 | <td>N*</td> |
---|
231 | <td>Number</td> |
---|
232 | </tr> |
---|
233 | <tr> |
---|
234 | <td>Nd</td> |
---|
235 | <td>Decimal Digit Number</td> |
---|
236 | </tr> |
---|
237 | <tr> |
---|
238 | <td>Nl</td> |
---|
239 | <td>Letter Number</td> |
---|
240 | </tr> |
---|
241 | <tr> |
---|
242 | <td>No</td> |
---|
243 | <td>Other Number</td> |
---|
244 | </tr> |
---|
245 | <tr> |
---|
246 | <td>P*</td> |
---|
247 | <td>Punctuation</td> |
---|
248 | </tr> |
---|
249 | <tr> |
---|
250 | <td>Pc</td> |
---|
251 | <td>Connector Punctuation</td> |
---|
252 | </tr> |
---|
253 | <tr> |
---|
254 | <td>Pd</td> |
---|
255 | <td>Dash Punctuation</td> |
---|
256 | </tr> |
---|
257 | <tr> |
---|
258 | <td>Pe</td> |
---|
259 | <td>Close Punctuation</td> |
---|
260 | </tr> |
---|
261 | <tr> |
---|
262 | <td>Pf</td> |
---|
263 | <td>Final Punctuation</td> |
---|
264 | </tr> |
---|
265 | <tr> |
---|
266 | <td>Pi</td> |
---|
267 | <td>Initial Punctuation</td> |
---|
268 | </tr> |
---|
269 | <tr> |
---|
270 | <td>Po</td> |
---|
271 | <td>Other Punctuation</td> |
---|
272 | </tr> |
---|
273 | <tr> |
---|
274 | <td>Ps</td> |
---|
275 | <td>Open Punctuation</td> |
---|
276 | </tr> |
---|
277 | <tr> |
---|
278 | <td>S*</td> |
---|
279 | <td>Symbol</td> |
---|
280 | </tr> |
---|
281 | <tr> |
---|
282 | <td>Sc</td> |
---|
283 | <td>Currency Symbol</td> |
---|
284 | </tr> |
---|
285 | <tr> |
---|
286 | <td>Sk</td> |
---|
287 | <td>Modifier Symbol</td> |
---|
288 | </tr> |
---|
289 | <tr> |
---|
290 | <td>Sm</td> |
---|
291 | <td>Math Symbol</td> |
---|
292 | </tr> |
---|
293 | <tr> |
---|
294 | <td>So</td> |
---|
295 | <td>Other Symbol</td> |
---|
296 | </tr> |
---|
297 | <tr> |
---|
298 | <td>Z*</td> |
---|
299 | <td>Separator</td> |
---|
300 | </tr> |
---|
301 | <tr> |
---|
302 | <td>Zl</td> |
---|
303 | <td>Line Separator</td> |
---|
304 | </tr> |
---|
305 | <tr> |
---|
306 | <td>Zp</td> |
---|
307 | <td>Paragraph Separator</td> |
---|
308 | </tr> |
---|
309 | <tr> |
---|
310 | <td>Zs</td> |
---|
311 | <td>Space Separator</td> |
---|
312 | </tr> |
---|
313 | </table> |
---|
314 | <HR> |
---|
315 | <P></P> |
---|
316 | <P></P> |
---|
317 | <p>Revised |
---|
318 | <!--webbot bot="Timestamp" S-Type="EDITED" S-Format="%d %B, %Y" startspan --> |
---|
319 | 10 Jan 2005 |
---|
320 | <!--webbot bot="Timestamp" endspan i-checksum="39359" --></p> |
---|
321 | <p><i>© Copyright John Maddock 2004-5</i></p> |
---|
322 | <P><I>Use, modification and distribution are subject to the Boost Software License, |
---|
323 | Version 1.0. (See accompanying file <A href="../../../LICENSE_1_0.txt">LICENSE_1_0.txt</A> |
---|
324 | or copy at <A href="http://www.boost.org/LICENSE_1_0.txt">http://www.boost.org/LICENSE_1_0.txt</A>)</I></P> |
---|
325 | </body> |
---|
326 | </html> |
---|