<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN">
<html lang="en">
<head>
<meta http-equiv="Content-Type" content="text/html;charset=iso-8859-1">
<title>ICU 3.8: utf8.h Source File</title>
<link href="doxygen.css" rel="stylesheet" type="text/css">
<link href="tabs.css" rel="stylesheet" type="text/css">
</head>
<body>
<!-- Generated by Doxygen 1.5.1 -->
<!--
  Syntax-highlighted source listing of utf8.h.
  Page layout: primary tab bar (with the search form), secondary tab bar,
  page heading, the listing itself, then the generator footer.
-->
<!-- Primary navigation; the tab for the current section carries id="current". -->
<div class="tabs">
  <ul>
    <li><a href="index.html"><span>Main Page</span></a></li>
    <li><a href="modules.html"><span>Modules</span></a></li>
    <li><a href="classes.html"><span>Data Structures</span></a></li>
    <li id="current"><a href="files.html"><span>Files</span></a></li>
    <li><a href="pages.html"><span>Related Pages</span></a></li>
    <li>
      <!-- The underlined "S" advertises the accesskey="s" shortcut on the query field. -->
      <form action="search.php" method="get">
        <table cellspacing="0" cellpadding="0" border="0">
          <tr>
            <td><label for="search-query"> <u>S</u>earch for </label></td>
            <td><input type="text" id="search-query" name="query" value="" size="20" accesskey="s"></td>
          </tr>
        </table>
      </form>
    </li>
  </ul>
</div>
<!-- Secondary navigation within the "Files" section. -->
<div class="tabs">
  <ul>
    <li><a href="files.html"><span>File List</span></a></li>
    <li><a href="globals.html"><span>Globals</span></a></li>
  </ul>
</div>
<h1>utf8.h</h1><a href="utf8_8h.html">Go to the documentation of this file.</a>
<!--
  Listing rules (whitespace is significant inside the pre element):
    * exactly one physical line per source line, each starting with a named
      anchor lNNNNN followed by the five-digit line number;
    * gaps in the numbering are lines that are absent from this listing;
    * the characters "less than", "greater than" and "ampersand" in the C text
      are written as character references so they are never parsed as markup.
-->
<div class="fragment"><pre class="fragment"><a name="l00001"></a>00001 <span class="comment">/*</span>
<a name="l00002"></a>00002 <span class="comment">*******************************************************************************</span>
<a name="l00003"></a>00003 <span class="comment">*</span>
<a name="l00004"></a>00004 <span class="comment">* Copyright (C) 1999-2007, International Business Machines</span>
<a name="l00005"></a>00005 <span class="comment">* Corporation and others. All Rights Reserved.</span>
<a name="l00006"></a>00006 <span class="comment">*</span>
<a name="l00007"></a>00007 <span class="comment">*******************************************************************************</span>
<a name="l00008"></a>00008 <span class="comment">* file name: utf8.h</span>
<a name="l00009"></a>00009 <span class="comment">* encoding: US-ASCII</span>
<a name="l00010"></a>00010 <span class="comment">* tab size: 8 (not used)</span>
<a name="l00011"></a>00011 <span class="comment">* indentation:4</span>
<a name="l00012"></a>00012 <span class="comment">*</span>
<a name="l00013"></a>00013 <span class="comment">* created on: 1999sep13</span>
<a name="l00014"></a>00014 <span class="comment">* created by: Markus W. Scherer</span>
<a name="l00015"></a>00015 <span class="comment">*/</span>
<a name="l00016"></a>00016
<a name="l00034"></a>00034 <span class="preprocessor">#ifndef __UTF8_H__</span>
<a name="l00035"></a>00035 <span class="preprocessor"></span><span class="preprocessor">#define __UTF8_H__</span>
<a name="l00036"></a>00036 <span class="preprocessor"></span>
<a name="l00037"></a>00037 <span class="comment">/* utf.h must be included first. */</span>
<a name="l00038"></a>00038 <span class="preprocessor">#ifndef __UTF_H__</span>
<a name="l00039"></a>00039 <span class="preprocessor"></span><span class="preprocessor"># include "<a class="code" href="utf_8h.html">unicode/utf.h</a>"</span>
<a name="l00040"></a>00040 <span class="preprocessor">#endif</span>
<a name="l00041"></a>00041 <span class="preprocessor"></span>
<a name="l00042"></a>00042 <span class="comment">/* internal definitions ----------------------------------------------------- */</span>
<a name="l00043"></a>00043
<a name="l00050"></a>00050 <span class="preprocessor">#ifdef U_UTF8_IMPL</span>
<a name="l00051"></a>00051 <span class="preprocessor"></span><a class="code" href="platform_8h.html#7d78411159504c2d6770763f924a1792">U_EXPORT</a> <span class="keyword">const</span> <a class="code" href="platform_8h.html#ba7bc1797add20fe3efdf37ced1182c5">uint8_t</a>
<a name="l00052"></a>00052 <span class="preprocessor">#elif defined(U_STATIC_IMPLEMENTATION) || defined(U_COMMON_IMPLEMENTATION)</span>
<a name="l00053"></a>00053 <span class="preprocessor"></span><a class="code" href="umachine_8h.html#f702d65cba0638c5a8194cccc8d7c39e">U_CFUNC</a> <span class="keyword">const</span> <a class="code" href="platform_8h.html#ba7bc1797add20fe3efdf37ced1182c5">uint8_t</a>
<a name="l00054"></a>00054 <span class="preprocessor">#else</span>
<a name="l00055"></a>00055 <span class="preprocessor"></span><a class="code" href="umachine_8h.html#f702d65cba0638c5a8194cccc8d7c39e">U_CFUNC</a> <a class="code" href="platform_8h.html#4099e2ee510ce74ddacfc2010306b8b5">U_IMPORT</a> <span class="keyword">const</span> <a class="code" href="platform_8h.html#ba7bc1797add20fe3efdf37ced1182c5">uint8_t</a> <span class="comment">/* U_IMPORT2? */</span> <span class="comment">/*U_IMPORT*/</span>
<a name="l00056"></a>00056 <span class="preprocessor">#endif</span>
<a name="l00057"></a><a class="code" href="utf8_8h.html#4e3ae25d5856272ab60ab87c28572a99">00057</a> <span class="preprocessor"></span><a class="code" href="utf8_8h.html#4e3ae25d5856272ab60ab87c28572a99">utf8_countTrailBytes</a>[256];
<a name="l00058"></a>00058
<a name="l00063"></a><a class="code" href="utf8_8h.html#e534bfef078b4f5d09e8da543a779db7">00063</a> <span class="preprocessor">#define U8_COUNT_TRAIL_BYTES(leadByte) (utf8_countTrailBytes[(uint8_t)leadByte])</span>
<a name="l00064"></a>00064 <span class="preprocessor"></span>
<a name="l00069"></a><a class="code" href="utf8_8h.html#e8ed1045986b8bf27814e9bc78388961">00069</a> <span class="preprocessor">#define U8_MASK_LEAD_BYTE(leadByte, countTrailBytes) ((leadByte)&amp;=(1&lt;&lt;(6-(countTrailBytes)))-1)</span>
<a name="l00070"></a>00070 <span class="preprocessor"></span>
<a name="l00075"></a>00075 <a class="code" href="umachine_8h.html#161dba69f4e479c3626793efc42f94ba">U_INTERNAL</a> <a class="code" href="umachine_8h.html#09fff5c3b5a5b015324dc3ec3cf92809">UChar32</a> <a class="code" href="platform_8h.html#72bf6d8ec0640a37b1915e5d853b2016">U_EXPORT2</a>
<a name="l00076"></a>00076 <a class="code" href="utf8_8h.html#6eaf56eb54abb71eafcc0c347daa821f">utf8_nextCharSafeBody</a>(<span class="keyword">const</span> <a class="code" href="platform_8h.html#ba7bc1797add20fe3efdf37ced1182c5">uint8_t</a> *s, <a class="code" href="platform_8h.html#b1967d8591af1a4e48c37fd2b0f184d0">int32_t</a> *pi, <a class="code" href="platform_8h.html#b1967d8591af1a4e48c37fd2b0f184d0">int32_t</a> <a class="code" href="ucnv_8h.html#c2d59ccd7e4666434391eab17b0e304f">length</a>, <a class="code" href="umachine_8h.html#09fff5c3b5a5b015324dc3ec3cf92809">UChar32</a> c, <a class="code" href="umachine_8h.html#349ef00011f20ccd1d3b424445681aa5">UBool</a> strict);
<a name="l00077"></a>00077
<a name="l00082"></a>00082 <a class="code" href="umachine_8h.html#161dba69f4e479c3626793efc42f94ba">U_INTERNAL</a> <a class="code" href="platform_8h.html#b1967d8591af1a4e48c37fd2b0f184d0">int32_t</a> <a class="code" href="platform_8h.html#72bf6d8ec0640a37b1915e5d853b2016">U_EXPORT2</a>
<a name="l00083"></a>00083 <a class="code" href="utf8_8h.html#6cf17491f1c237bbe5b002056b830fd3">utf8_appendCharSafeBody</a>(<a class="code" href="platform_8h.html#ba7bc1797add20fe3efdf37ced1182c5">uint8_t</a> *s, <a class="code" href="platform_8h.html#b1967d8591af1a4e48c37fd2b0f184d0">int32_t</a> i, <a class="code" href="platform_8h.html#b1967d8591af1a4e48c37fd2b0f184d0">int32_t</a> <a class="code" href="ucnv_8h.html#c2d59ccd7e4666434391eab17b0e304f">length</a>, <a class="code" href="umachine_8h.html#09fff5c3b5a5b015324dc3ec3cf92809">UChar32</a> c, <a class="code" href="umachine_8h.html#349ef00011f20ccd1d3b424445681aa5">UBool</a> *pIsError);
<a name="l00084"></a>00084
<a name="l00089"></a>00089 <a class="code" href="umachine_8h.html#161dba69f4e479c3626793efc42f94ba">U_INTERNAL</a> <a class="code" href="umachine_8h.html#09fff5c3b5a5b015324dc3ec3cf92809">UChar32</a> <a class="code" href="platform_8h.html#72bf6d8ec0640a37b1915e5d853b2016">U_EXPORT2</a>
<a name="l00090"></a>00090 <a class="code" href="utf8_8h.html#2bbae41d2d845750088a17dc55f59096">utf8_prevCharSafeBody</a>(<span class="keyword">const</span> <a class="code" href="platform_8h.html#ba7bc1797add20fe3efdf37ced1182c5">uint8_t</a> *s, <a class="code" href="platform_8h.html#b1967d8591af1a4e48c37fd2b0f184d0">int32_t</a> start, <a class="code" href="platform_8h.html#b1967d8591af1a4e48c37fd2b0f184d0">int32_t</a> *pi, <a class="code" href="umachine_8h.html#09fff5c3b5a5b015324dc3ec3cf92809">UChar32</a> c, <a class="code" href="umachine_8h.html#349ef00011f20ccd1d3b424445681aa5">UBool</a> strict);
<a name="l00091"></a>00091
<a name="l00096"></a>00096 <a class="code" href="umachine_8h.html#161dba69f4e479c3626793efc42f94ba">U_INTERNAL</a> <a class="code" href="platform_8h.html#b1967d8591af1a4e48c37fd2b0f184d0">int32_t</a> <a class="code" href="platform_8h.html#72bf6d8ec0640a37b1915e5d853b2016">U_EXPORT2</a>
<a name="l00097"></a>00097 <a class="code" href="utf8_8h.html#4017310e2ecadac7dea5a432a33ccf30">utf8_back1SafeBody</a>(<span class="keyword">const</span> <a class="code" href="platform_8h.html#ba7bc1797add20fe3efdf37ced1182c5">uint8_t</a> *s, <a class="code" href="platform_8h.html#b1967d8591af1a4e48c37fd2b0f184d0">int32_t</a> start, <a class="code" href="platform_8h.html#b1967d8591af1a4e48c37fd2b0f184d0">int32_t</a> i);
<a name="l00098"></a>00098
<a name="l00099"></a>00099 <span class="comment">/* single-code point definitions -------------------------------------------- */</span>
<a name="l00100"></a>00100
<a name="l00107"></a><a class="code" href="utf8_8h.html#8f3a9427d880458a9fa6b169a3cc1b3c">00107</a> <span class="preprocessor">#define U8_IS_SINGLE(c) (((c)&amp;0x80)==0)</span>
<a name="l00108"></a>00108 <span class="preprocessor"></span>
<a name="l00115"></a><a class="code" href="utf8_8h.html#db9837ea38dd811524a5b761ddc2a2ca">00115</a> <span class="preprocessor">#define U8_IS_LEAD(c) ((uint8_t)((c)-0xc0)&lt;0x3e)</span>
<a name="l00116"></a>00116 <span class="preprocessor"></span>
<a name="l00123"></a><a class="code" href="utf8_8h.html#fed9fc9bf480bf15a2e6051774f2d80e">00123</a> <span class="preprocessor">#define U8_IS_TRAIL(c) (((c)&amp;0xc0)==0x80)</span>
<a name="l00124"></a>00124 <span class="preprocessor"></span>
<a name="l00132"></a><a class="code" href="utf8_8h.html#f1730b8bbb3053465ee58702821846f1">00132</a> <span class="preprocessor">#define U8_LENGTH(c) \</span>
<a name="l00133"></a>00133 <span class="preprocessor">    ((uint32_t)(c)&lt;=0x7f ? 1 : \</span>
<a name="l00134"></a>00134 <span class="preprocessor">        ((uint32_t)(c)&lt;=0x7ff ? 2 : \</span>
<a name="l00135"></a>00135 <span class="preprocessor">            ((uint32_t)(c)&lt;=0xd7ff ? 3 : \</span>
<a name="l00136"></a>00136 <span class="preprocessor">                ((uint32_t)(c)&lt;=0xdfff || (uint32_t)(c)&gt;0x10ffff ? 0 : \</span>
<a name="l00137"></a>00137 <span class="preprocessor">                    ((uint32_t)(c)&lt;=0xffff ? 3 : 4)\</span>
<a name="l00138"></a>00138 <span class="preprocessor">                ) \</span>
<a name="l00139"></a>00139 <span class="preprocessor">            ) \</span>
<a name="l00140"></a>00140 <span class="preprocessor">        ) \</span>
<a name="l00141"></a>00141 <span class="preprocessor">    )</span>
<a name="l00142"></a>00142 <span class="preprocessor"></span>
<a name="l00148"></a><a class="code" href="utf8_8h.html#a2298b48749d9f45772c8f5a6885464a">00148</a> <span class="preprocessor">#define U8_MAX_LENGTH 4</span>
<a name="l00149"></a>00149 <span class="preprocessor"></span>
<a name="l00166"></a><a class="code" href="utf8_8h.html#125e5e7a4ef2f3f57b078f706b2b67f8">00166</a> <span class="preprocessor">#define U8_GET_UNSAFE(s, i, c) { \</span>
<a name="l00167"></a>00167 <span class="preprocessor">    int32_t _u8_get_unsafe_index=(int32_t)(i); \</span>
<a name="l00168"></a>00168 <span class="preprocessor">    U8_SET_CP_START_UNSAFE(s, _u8_get_unsafe_index); \</span>
<a name="l00169"></a>00169 <span class="preprocessor">    U8_NEXT_UNSAFE(s, _u8_get_unsafe_index, c); \</span>
<a name="l00170"></a>00170 <span class="preprocessor">}</span>
<a name="l00171"></a>00171 <span class="preprocessor"></span>
<a name="l00190"></a><a class="code" href="utf8_8h.html#10a57a084d75604c4a81fb5eec46ae6a">00190</a> <span class="preprocessor">#define U8_GET(s, start, i, length, c) { \</span>
<a name="l00191"></a>00191 <span class="preprocessor">    int32_t _u8_get_index=(int32_t)(i); \</span>
<a name="l00192"></a>00192 <span class="preprocessor">    U8_SET_CP_START(s, start, _u8_get_index); \</span>
<a name="l00193"></a>00193 <span class="preprocessor">    U8_NEXT(s, _u8_get_index, length, c); \</span>
<a name="l00194"></a>00194 <span class="preprocessor">}</span>
<a name="l00195"></a>00195 <span class="preprocessor"></span>
<a name="l00196"></a>00196 <span class="comment">/* definitions with forward iteration --------------------------------------- */</span>
<a name="l00197"></a>00197
<a name="l00215"></a><a class="code" href="utf8_8h.html#28ecdb4233301285fc4ce7f9ea1ed644">00215</a> <span class="preprocessor">#define U8_NEXT_UNSAFE(s, i, c) { \</span>
<a name="l00216"></a>00216 <span class="preprocessor">    (c)=(uint8_t)(s)[(i)++]; \</span>
<a name="l00217"></a>00217 <span class="preprocessor">    if((uint8_t)((c)-0xc0)&lt;0x35) { \</span>
<a name="l00218"></a>00218 <span class="preprocessor">        uint8_t __count=U8_COUNT_TRAIL_BYTES(c); \</span>
<a name="l00219"></a>00219 <span class="preprocessor">        U8_MASK_LEAD_BYTE(c, __count); \</span>
<a name="l00220"></a>00220 <span class="preprocessor">        switch(__count) { \</span>
<a name="l00221"></a>00221 <span class="preprocessor">        </span><span class="comment">/* each following branch falls through to the next one */</span> \
<a name="l00222"></a>00222         case 3: \
<a name="l00223"></a>00223             (c)=((c)&lt;&lt;6)|((s)[(i)++]&amp;0x3f); \
<a name="l00224"></a>00224         case 2: \
<a name="l00225"></a>00225             (c)=((c)&lt;&lt;6)|((s)[(i)++]&amp;0x3f); \
<a name="l00226"></a>00226         case 1: \
<a name="l00227"></a>00227             (c)=((c)&lt;&lt;6)|((s)[(i)++]&amp;0x3f); \
<a name="l00228"></a>00228         <span class="comment">/* no other branches to optimize switch() */</span> \
<a name="l00229"></a>00229             break; \
<a name="l00230"></a>00230         } \
<a name="l00231"></a>00231     } \
<a name="l00232"></a>00232 }
<a name="l00233"></a>00233
<a name="l00252"></a><a class="code" href="utf8_8h.html#57f3e5429ae4edb27a42367c627aa482">00252</a> <span class="preprocessor">#define U8_NEXT(s, i, length, c) { \</span>
<a name="l00253"></a>00253 <span class="preprocessor">    (c)=(uint8_t)(s)[(i)++]; \</span>
<a name="l00254"></a>00254 <span class="preprocessor">    if((c)&gt;=0x80) { \</span>
<a name="l00255"></a>00255 <span class="preprocessor">        uint8_t __t1, __t2; \</span>
<a name="l00256"></a>00256 <span class="preprocessor">        if( </span><span class="comment">/* handle U+1000..U+CFFF inline */</span> \
<a name="l00257"></a>00257             (0xe0&lt;(c) &amp;&amp; (c)&lt;=0xec) &amp;&amp; \
<a name="l00258"></a>00258             (((i)+1)&lt;(length)) &amp;&amp; \
<a name="l00259"></a>00259             (__t1=(uint8_t)((s)[i]-0x80))&lt;=0x3f &amp;&amp; \
<a name="l00260"></a>00260             (__t2=(uint8_t)((s)[(i)+1]-0x80))&lt;= 0x3f \
<a name="l00261"></a>00261         ) { \
<a name="l00262"></a>00262             <span class="comment">/* no need for (c&amp;0xf) because the upper bits are truncated after &lt;&lt;12 in the cast to (UChar) */</span> \
<a name="l00263"></a>00263             (c)=(UChar)(((c)&lt;&lt;12)|(__t1&lt;&lt;6)|__t2); \
<a name="l00264"></a>00264             (i)+=2; \
<a name="l00265"></a>00265         } else if( <span class="comment">/* handle U+0080..U+07FF inline */</span> \
<a name="l00266"></a>00266             ((c)&lt;0xe0 &amp;&amp; (c)&gt;=0xc2) &amp;&amp; \
<a name="l00267"></a>00267             ((i)&lt;(length)) &amp;&amp; \
<a name="l00268"></a>00268             (__t1=(uint8_t)((s)[i]-0x80))&lt;=0x3f \
<a name="l00269"></a>00269         ) { \
<a name="l00270"></a>00270             (c)=(UChar)((((c)&amp;0x1f)&lt;&lt;6)|__t1); \
<a name="l00271"></a>00271             ++(i); \
<a name="l00272"></a>00272         } else if(U8_IS_LEAD(c)) { \
<a name="l00273"></a>00273             <span class="comment">/* function call for "complicated" and error cases */</span> \
<a name="l00274"></a>00274             (c)=utf8_nextCharSafeBody((const uint8_t *)s, &amp;(i), (int32_t)(length), c, -1); \
<a name="l00275"></a>00275         } else { \
<a name="l00276"></a>00276             (c)=U_SENTINEL; \
<a name="l00277"></a>00277         } \
<a name="l00278"></a>00278     } \
<a name="l00279"></a>00279 }
<a name="l00280"></a>00280
<a name="l00294"></a><a class="code" href="utf8_8h.html#154f04764da5af41729c4df6bf9e09f3">00294</a> <span class="preprocessor">#define U8_APPEND_UNSAFE(s, i, c) { \</span>
<a name="l00295"></a>00295 <span class="preprocessor">    if((uint32_t)(c)&lt;=0x7f) { \</span>
<a name="l00296"></a>00296 <span class="preprocessor">        (s)[(i)++]=(uint8_t)(c); \</span>
<a name="l00297"></a>00297 <span class="preprocessor">    } else { \</span>
<a name="l00298"></a>00298 <span class="preprocessor">        if((uint32_t)(c)&lt;=0x7ff) { \</span>
<a name="l00299"></a>00299 <span class="preprocessor">            (s)[(i)++]=(uint8_t)(((c)&gt;&gt;6)|0xc0); \</span>
<a name="l00300"></a>00300 <span class="preprocessor">        } else { \</span>
<a name="l00301"></a>00301 <span class="preprocessor">            if((uint32_t)(c)&lt;=0xffff) { \</span>
<a name="l00302"></a>00302 <span class="preprocessor">                (s)[(i)++]=(uint8_t)(((c)&gt;&gt;12)|0xe0); \</span>
<a name="l00303"></a>00303 <span class="preprocessor">            } else { \</span>
<a name="l00304"></a>00304 <span class="preprocessor">                (s)[(i)++]=(uint8_t)(((c)&gt;&gt;18)|0xf0); \</span>
<a name="l00305"></a>00305 <span class="preprocessor">                (s)[(i)++]=(uint8_t)((((c)&gt;&gt;12)&amp;0x3f)|0x80); \</span>
<a name="l00306"></a>00306 <span class="preprocessor">            } \</span>
<a name="l00307"></a>00307 <span class="preprocessor">            (s)[(i)++]=(uint8_t)((((c)&gt;&gt;6)&amp;0x3f)|0x80); \</span>
<a name="l00308"></a>00308 <span class="preprocessor">        } \</span>
<a name="l00309"></a>00309 <span class="preprocessor">        (s)[(i)++]=(uint8_t)(((c)&amp;0x3f)|0x80); \</span>
<a name="l00310"></a>00310 <span class="preprocessor">    } \</span>
<a name="l00311"></a>00311 <span class="preprocessor">}</span>
<a name="l00312"></a>00312 <span class="preprocessor"></span>
<a name="l00330"></a><a class="code" href="utf8_8h.html#8a013997e3d13c501ce73bc45e662881">00330</a> <span class="preprocessor">#define U8_APPEND(s, i, capacity, c, isError) { \</span>
<a name="l00331"></a>00331 <span class="preprocessor">    if((uint32_t)(c)&lt;=0x7f) { \</span>
<a name="l00332"></a>00332 <span class="preprocessor">        (s)[(i)++]=(uint8_t)(c); \</span>
<a name="l00333"></a>00333 <span class="preprocessor">    } else if((uint32_t)(c)&lt;=0x7ff &amp;&amp; (i)+1&lt;(capacity)) { \</span>
<a name="l00334"></a>00334 <span class="preprocessor">        (s)[(i)++]=(uint8_t)(((c)&gt;&gt;6)|0xc0); \</span>
<a name="l00335"></a>00335 <span class="preprocessor">        (s)[(i)++]=(uint8_t)(((c)&amp;0x3f)|0x80); \</span>
<a name="l00336"></a>00336 <span class="preprocessor">    } else if((uint32_t)(c)&lt;=0xd7ff &amp;&amp; (i)+2&lt;(capacity)) { \</span>
<a name="l00337"></a>00337 <span class="preprocessor">        (s)[(i)++]=(uint8_t)(((c)&gt;&gt;12)|0xe0); \</span>
<a name="l00338"></a>00338 <span class="preprocessor">        (s)[(i)++]=(uint8_t)((((c)&gt;&gt;6)&amp;0x3f)|0x80); \</span>
<a name="l00339"></a>00339 <span class="preprocessor">        (s)[(i)++]=(uint8_t)(((c)&amp;0x3f)|0x80); \</span>
<a name="l00340"></a>00340 <span class="preprocessor">    } else { \</span>
<a name="l00341"></a>00341 <span class="preprocessor">        (i)=utf8_appendCharSafeBody(s, (int32_t)(i), (int32_t)(capacity), c, &amp;(isError)); \</span>
<a name="l00342"></a>00342 <span class="preprocessor">    } \</span>
<a name="l00343"></a>00343 <span class="preprocessor">}</span>
<a name="l00344"></a>00344 <span class="preprocessor"></span>
<a name="l00355"></a><a class="code" href="utf8_8h.html#64a8113aea2125f806cbf5d77294b3cd">00355</a> <span class="preprocessor">#define U8_FWD_1_UNSAFE(s, i) { \</span>
<a name="l00356"></a>00356 <span class="preprocessor">    (i)+=1+U8_COUNT_TRAIL_BYTES((s)[i]); \</span>
<a name="l00357"></a>00357 <span class="preprocessor">}</span>
<a name="l00358"></a>00358 <span class="preprocessor"></span>
<a name="l00370"></a><a class="code" href="utf8_8h.html#6d4c94e845b059fddba0c51e9bad87fd">00370</a> <span class="preprocessor">#define U8_FWD_1(s, i, length) { \</span>
<a name="l00371"></a>00371 <span class="preprocessor">    uint8_t __b=(uint8_t)(s)[(i)++]; \</span>
<a name="l00372"></a>00372 <span class="preprocessor">    if(U8_IS_LEAD(__b)) { \</span>
<a name="l00373"></a>00373 <span class="preprocessor">        uint8_t __count=U8_COUNT_TRAIL_BYTES(__b); \</span>
<a name="l00374"></a>00374 <span class="preprocessor">        if((i)+__count&gt;(length)) { \</span>
<a name="l00375"></a>00375 <span class="preprocessor">            __count=(uint8_t)((length)-(i)); \</span>
<a name="l00376"></a>00376 <span class="preprocessor">        } \</span>
<a name="l00377"></a>00377 <span class="preprocessor">        while(__count&gt;0 &amp;&amp; U8_IS_TRAIL((s)[i])) { \</span>
<a name="l00378"></a>00378 <span class="preprocessor">            ++(i); \</span>
<a name="l00379"></a>00379 <span class="preprocessor">            --__count; \</span>
<a name="l00380"></a>00380 <span class="preprocessor">        } \</span>
<a name="l00381"></a>00381 <span class="preprocessor">    } \</span>
<a name="l00382"></a>00382 <span class="preprocessor">}</span>
<a name="l00383"></a>00383 <span class="preprocessor"></span>
<a name="l00396"></a><a class="code" href="utf8_8h.html#8e8b4218834110431798cc84a0a664ae">00396</a> <span class="preprocessor">#define U8_FWD_N_UNSAFE(s, i, n) { \</span>
<a name="l00397"></a>00397 <span class="preprocessor">    int32_t __N=(n); \</span>
<a name="l00398"></a>00398 <span class="preprocessor">    while(__N&gt;0) { \</span>
<a name="l00399"></a>00399 <span class="preprocessor">        U8_FWD_1_UNSAFE(s, i); \</span>
<a name="l00400"></a>00400 <span class="preprocessor">        --__N; \</span>
<a name="l00401"></a>00401 <span class="preprocessor">    } \</span>
<a name="l00402"></a>00402 <span class="preprocessor">}</span>
<a name="l00403"></a>00403 <span class="preprocessor"></span>
<a name="l00417"></a><a class="code" href="utf8_8h.html#9a311dc48b8aa1050345b886adabf213">00417</a> <span class="preprocessor">#define U8_FWD_N(s, i, length, n) { \</span>
<a name="l00418"></a>00418 <span class="preprocessor">    int32_t __N=(n); \</span>
<a name="l00419"></a>00419 <span class="preprocessor">    while(__N&gt;0 &amp;&amp; (i)&lt;(length)) { \</span>
<a name="l00420"></a>00420 <span class="preprocessor">        U8_FWD_1(s, i, length); \</span>
<a name="l00421"></a>00421 <span class="preprocessor">        --__N; \</span>
<a name="l00422"></a>00422 <span class="preprocessor">    } \</span>
<a name="l00423"></a>00423 <span class="preprocessor">}</span>
<a name="l00424"></a>00424 <span class="preprocessor"></span>
<a name="l00438"></a><a class="code" href="utf8_8h.html#c46a385dbf64c97337522e1d1875a57e">00438</a> <span class="preprocessor">#define U8_SET_CP_START_UNSAFE(s, i) { \</span>
<a name="l00439"></a>00439 <span class="preprocessor">    while(U8_IS_TRAIL((s)[i])) { --(i); } \</span>
<a name="l00440"></a>00440 <span class="preprocessor">}</span>
<a name="l00441"></a>00441 <span class="preprocessor"></span>
<a name="l00456"></a><a class="code" href="utf8_8h.html#a6d33627a8a5420a8f61e50da2aeca2a">00456</a> <span class="preprocessor">#define U8_SET_CP_START(s, start, i) { \</span>
<a name="l00457"></a>00457 <span class="preprocessor">    if(U8_IS_TRAIL((s)[(i)])) { \</span>
<a name="l00458"></a>00458 <span class="preprocessor">        (i)=utf8_back1SafeBody(s, start, (int32_t)(i)); \</span>
<a name="l00459"></a>00459 <span class="preprocessor">    } \</span>
<a name="l00460"></a>00460 <span class="preprocessor">}</span>
<a name="l00461"></a>00461 <span class="preprocessor"></span>
<a name="l00462"></a>00462 <span class="comment">/* definitions with backward iteration -------------------------------------- */</span>
<a name="l00463"></a>00463
<a name="l00483"></a><a class="code" href="utf8_8h.html#5f78eb19a6b25f61dccbae45d6ecf955">00483</a> <span class="preprocessor">#define U8_PREV_UNSAFE(s, i, c) { \</span>
<a name="l00484"></a>00484 <span class="preprocessor">    (c)=(uint8_t)(s)[--(i)]; \</span>
<a name="l00485"></a>00485 <span class="preprocessor">    if(U8_IS_TRAIL(c)) { \</span>
<a name="l00486"></a>00486 <span class="preprocessor">        uint8_t __b, __count=1, __shift=6; \</span>
<a name="l00487"></a>00487 <span class="preprocessor">\</span>
<a name="l00488"></a>00488 <span class="preprocessor">        </span><span class="comment">/* c is a trail byte */</span> \
<a name="l00489"></a>00489         (c)&amp;=0x3f; \
<a name="l00490"></a>00490         for(;;) { \
<a name="l00491"></a>00491             __b=(uint8_t)(s)[--(i)]; \
<a name="l00492"></a>00492             if(__b&gt;=0xc0) { \
<a name="l00493"></a>00493                 U8_MASK_LEAD_BYTE(__b, __count); \
<a name="l00494"></a>00494                 (c)|=(UChar32)__b&lt;&lt;__shift; \
<a name="l00495"></a>00495                 break; \
<a name="l00496"></a>00496             } else { \
<a name="l00497"></a>00497                 (c)|=(UChar32)(__b&amp;0x3f)&lt;&lt;__shift; \
<a name="l00498"></a>00498                 ++__count; \
<a name="l00499"></a>00499                 __shift+=6; \
<a name="l00500"></a>00500             } \
<a name="l00501"></a>00501         } \
<a name="l00502"></a>00502     } \
<a name="l00503"></a>00503 }
<a name="l00504"></a>00504
<a name="l00525"></a><a class="code" href="utf8_8h.html#17287c1f01ce84fdf8852a756643b076">00525</a> <span class="preprocessor">#define U8_PREV(s, start, i, c) { \</span>
<a name="l00526"></a>00526 <span class="preprocessor">    (c)=(uint8_t)(s)[--(i)]; \</span>
<a name="l00527"></a>00527 <span class="preprocessor">    if((c)&gt;=0x80) { \</span>
<a name="l00528"></a>00528 <span class="preprocessor">        if((c)&lt;=0xbf) { \</span>
<a name="l00529"></a>00529 <span class="preprocessor">            (c)=utf8_prevCharSafeBody((const uint8_t *)s, start, &amp;(i), c, -1); \</span>
<a name="l00530"></a>00530 <span class="preprocessor">        } else { \</span>
<a name="l00531"></a>00531 <span class="preprocessor">            (c)=U_SENTINEL; \</span>
<a name="l00532"></a>00532 <span class="preprocessor">        } \</span>
<a name="l00533"></a>00533 <span class="preprocessor">    } \</span>
<a name="l00534"></a>00534 <span class="preprocessor">}</span>
<a name="l00535"></a>00535 <span class="preprocessor"></span>
<a name="l00547"></a><a class="code" href="utf8_8h.html#3969beb6252f8605ab678990c8af2f48">00547</a> <span class="preprocessor">#define U8_BACK_1_UNSAFE(s, i) { \</span>
<a name="l00548"></a>00548 <span class="preprocessor">    while(U8_IS_TRAIL((s)[--(i)])) {} \</span>
<a name="l00549"></a>00549 <span class="preprocessor">}</span>
<a name="l00550"></a>00550 <span class="preprocessor"></span>
<a name="l00563"></a><a class="code" href="utf8_8h.html#dac4ee359e6233cb2990b1047fd5be3c">00563</a> <span class="preprocessor">#define U8_BACK_1(s, start, i) { \</span>
<a name="l00564"></a>00564 <span class="preprocessor">    if(U8_IS_TRAIL((s)[--(i)])) { \</span>
<a name="l00565"></a>00565 <span class="preprocessor">        (i)=utf8_back1SafeBody(s, start, (int32_t)(i)); \</span>
<a name="l00566"></a>00566 <span class="preprocessor">    } \</span>
<a name="l00567"></a>00567 <span class="preprocessor">}</span>
<a name="l00568"></a>00568 <span class="preprocessor"></span>
<a name="l00582"></a><a class="code" href="utf8_8h.html#a36f62ea4ac87362e376e4cbea10098d">00582</a> <span class="preprocessor">#define U8_BACK_N_UNSAFE(s, i, n) { \</span>
<a name="l00583"></a>00583 <span class="preprocessor">    int32_t __N=(n); \</span>
<a name="l00584"></a>00584 <span class="preprocessor">    while(__N&gt;0) { \</span>
<a name="l00585"></a>00585 <span class="preprocessor">        U8_BACK_1_UNSAFE(s, i); \</span>
<a name="l00586"></a>00586 <span class="preprocessor">        --__N; \</span>
<a name="l00587"></a>00587 <span class="preprocessor">    } \</span>
<a name="l00588"></a>00588 <span class="preprocessor">}</span>
<a name="l00589"></a>00589 <span class="preprocessor"></span>
<a name="l00604"></a><a class="code" href="utf8_8h.html#b0ce585952c8ba4b103fb6b7aea801ba">00604</a> <span class="preprocessor">#define U8_BACK_N(s, start, i, n) { \</span>
<a name="l00605"></a>00605 <span class="preprocessor">    int32_t __N=(n); \</span>
<a name="l00606"></a>00606 <span class="preprocessor">    while(__N&gt;0 &amp;&amp; (i)&gt;(start)) { \</span>
<a name="l00607"></a>00607 <span class="preprocessor">        U8_BACK_1(s, start, i); \</span>
<a name="l00608"></a>00608 <span class="preprocessor">        --__N; \</span>
<a name="l00609"></a>00609 <span class="preprocessor">    } \</span>
<a name="l00610"></a>00610 <span class="preprocessor">}</span>
<a name="l00611"></a>00611 <span class="preprocessor"></span>
<a name="l00625"></a><a class="code" href="utf8_8h.html#910ba47de6d82fafc25b5e12f3a68588">00625</a> <span class="preprocessor">#define U8_SET_CP_LIMIT_UNSAFE(s, i) { \</span>
<a name="l00626"></a>00626 <span class="preprocessor">    U8_BACK_1_UNSAFE(s, i); \</span>
<a name="l00627"></a>00627 <span class="preprocessor">    U8_FWD_1_UNSAFE(s, i); \</span>
<a name="l00628"></a>00628 <span class="preprocessor">}</span>
<a name="l00629"></a>00629 <span class="preprocessor"></span>
<a name="l00645"></a><a class="code" href="utf8_8h.html#40fe523809a3a4e647e47513336b81d9">00645</a> <span class="preprocessor">#define U8_SET_CP_LIMIT(s, start, i, length) { \</span>
<a name="l00646"></a>00646 <span class="preprocessor">    if((start)&lt;(i) &amp;&amp; (i)&lt;(length)) { \</span>
<a name="l00647"></a>00647 <span class="preprocessor">        U8_BACK_1(s, start, i); \</span>
<a name="l00648"></a>00648 <span class="preprocessor">        U8_FWD_1(s, i, length); \</span>
<a name="l00649"></a>00649 <span class="preprocessor">    } \</span>
<a name="l00650"></a>00650 <span class="preprocessor">}</span>
<a name="l00651"></a>00651 <span class="preprocessor"></span>
<a name="l00652"></a>00652 <span class="preprocessor">#endif</span>
</pre></div>
<!-- Generator footer. "text-align" is the CSS property that right-aligns this block; "align" is not a CSS property. -->
<hr size="1">
<address style="text-align: right;"><small>Generated on Fri Sep 14 12:59:21 2007 for ICU 3.8 by
<a href="http://www.doxygen.org/index.html">
<img src="doxygen.png" alt="doxygen" align="middle" border="0"></a> 1.5.1 </small></address>
</body>
</html>