Sophie

Sophie

distrib > Mandriva > 9.1 > ppc > by-pkgid > a74ec78bdb789d910d054e3918f3f007 > files > 578

libsword1-devel-1.5.5-2mdk.ppc.rpm

<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.0 Transitional//EN">
<html><head><meta http-equiv="Content-Type" content="text/html;charset=iso-8859-1">
<title>utf8utf16.cpp Source File</title>
<link href="doxygen.css" rel="stylesheet" type="text/css">
</head><body>
<!-- Generated by Doxygen 1.2.15 -->
<center>
<a class="qindex" href="index.html">Main Page</a> &nbsp; <a class="qindex" href="namespaces.html">Namespace List</a> &nbsp; <a class="qindex" href="hierarchy.html">Class Hierarchy</a> &nbsp; <a class="qindex" href="classes.html">Alphabetical List</a> &nbsp; <a class="qindex" href="annotated.html">Compound List</a> &nbsp; <a class="qindex" href="files.html">File List</a> &nbsp; <a class="qindex" href="functions.html">Compound Members</a> &nbsp; </center>
<hr><h1>utf8utf16.cpp</h1><div class="fragment"><pre>00001 <font class="comment">/******************************************************************************</font>
00002 <font class="comment"> *</font>
00003 <font class="comment"> * UTF8UTF16 -  SWFilter decendant to convert UTF-8 to UTF-16</font>
00004 <font class="comment"> *</font>
00005 <font class="comment"> */</font>
00006 
00007 <font class="preprocessor">#include &lt;stdlib.h&gt;</font>
00008 <font class="preprocessor">#include &lt;stdio.h&gt;</font>
00009 
00010 <font class="preprocessor">#include &lt;utf8utf16.h&gt;</font>
00011 
00012 UTF8UTF16::UTF8UTF16() {
00013 }
00014 
00015 
00016 <font class="keywordtype">char</font> UTF8UTF16::ProcessText(<font class="keywordtype">char</font> *text, <font class="keywordtype">int</font> maxlen, <font class="keyword">const</font> <a class="code" href="class_s_w_key.html">SWKey</a> *key, <font class="keyword">const</font> <a class="code" href="class_s_w_module.html">SWModule</a> *module)
00017 {
00018   <font class="keywordtype">unsigned</font> <font class="keywordtype">char</font> *from;
00019   <font class="keywordtype">unsigned</font> <font class="keywordtype">short</font> *to;
00020 
00021   <font class="keywordtype">int</font> len;
00022   <font class="keywordtype">unsigned</font> <font class="keywordtype">long</font> uchar;
00023   <font class="keywordtype">unsigned</font> <font class="keywordtype">char</font> significantFirstBits, subsequent;
00024   <font class="keywordtype">unsigned</font> <font class="keywordtype">short</font> schar;
00025   
00026   len = strlen(text) + 1;                                               <font class="comment">// shift string to right of buffer</font>
00027   <font class="keywordflow">if</font> (len &lt; maxlen) {
00028     memmove(&amp;text[maxlen - len], text, len);
00029     from = (<font class="keywordtype">unsigned</font> <font class="keywordtype">char</font>*)&amp;text[maxlen - len];
00030   }
00031   <font class="keywordflow">else</font>
00032     from = (<font class="keywordtype">unsigned</font> <font class="keywordtype">char</font>*)text;
00033   
00034   
00035   <font class="comment">// -------------------------------</font>
00036   
00037   <font class="keywordflow">for</font> (to = (<font class="keywordtype">unsigned</font> <font class="keywordtype">short</font>*)text; *from; from++) {
00038     uchar = 0;
00039     <font class="keywordflow">if</font> ((*from &amp; 128) != 128) {
00040       <font class="comment">//                if (*from != ' ')</font>
00041       uchar = *from;
00042     }
00043     <font class="keywordflow">else</font> <font class="keywordflow">if</font> ((*from &amp; 128) &amp;&amp; ((*from &amp; 64) != 64)) {
00044       <font class="comment">// error, do nothing</font>
00045       <font class="keywordflow">continue</font>;
00046     }
00047     <font class="keywordflow">else</font> {
00048       *from &lt;&lt;= 1;
00049       <font class="keywordflow">for</font> (subsequent = 1; (*from &amp; 128); subsequent++) {
00050         *from &lt;&lt;= 1;
00051         from[subsequent] &amp;= 63;
00052         uchar &lt;&lt;= 6;
00053         uchar |= from[subsequent];
00054       }
00055       subsequent--;
00056       *from &lt;&lt;=1;
00057       significantFirstBits = 8 - (2+subsequent);
00058       
00059       uchar |= (((short)*from) &lt;&lt; (((6*subsequent)+significantFirstBits)-8));
00060       from += subsequent;
00061     }
00062 
00063     <font class="keywordflow">if</font> (uchar &lt; 0x1ffff) {
00064       *to++ = (<font class="keywordtype">unsigned</font> <font class="keywordtype">short</font>)uchar;
00065     }
00066     <font class="keywordflow">else</font> {
00067       uchar -= 0x10000;
00068       schar = 0xD800 | (uchar &amp; 0x03ff);
00069       uchar &gt;&gt;= 10;
00070       uchar |= 0xDC00;
00071       *to++ = (<font class="keywordtype">unsigned</font> <font class="keywordtype">short</font>)schar;
00072       *to++ = (<font class="keywordtype">unsigned</font> <font class="keywordtype">short</font>)uchar;
00073     }
00074   }
00075   *to = (<font class="keywordtype">unsigned</font> <font class="keywordtype">short</font>)0;
00076 
00077   <font class="keywordflow">return</font> 0;
00078 }
00079 
</pre></div><hr><address align="right"><small>Generated on Thu Jun 20 22:13:01 2002 for The Sword Project by
<a href="http://www.doxygen.org/index.html">
<img src="doxygen.png" alt="doxygen" align="middle" border=0 
width=110 height=53></a>1.2.15 </small></address>
</body>
</html>