Sophie

Sophie

distrib > Fedora > 14 > x86_64 > by-pkgid > 8d1ef08c9e0d44c69764afc615a03d0d > files > 1711

ghc-ghc-devel-6.12.3-5.fc14.i686.rpm

<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
<!-- Generated by HsColour, http://www.cs.york.ac.uk/fp/darcs/hscolour/ -->
<!-- Explicit charset declaration: the XML declaration is ignored when this
     page is served as text/html, so state the encoding in the document too. -->
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
<title>utils/Encoding.hs</title>
<link rel="stylesheet" type="text/css" href="hscolour.css" />
</head>
<body>
<pre><a name="line-1"></a><span class='hs-comment'>{-# OPTIONS_GHC -O #-}</span>
<a name="line-2"></a><span class='hs-comment'>-- We always optimise this, otherwise performance of a non-optimised</span>
<a name="line-3"></a><span class='hs-comment'>-- compiler is severely affected</span>
<a name="line-4"></a>
<a name="line-5"></a><span class='hs-comment'>-- -----------------------------------------------------------------------------</span>
<a name="line-6"></a><span class='hs-comment'>--</span>
<a name="line-7"></a><span class='hs-comment'>-- (c) The University of Glasgow, 1997-2006</span>
<a name="line-8"></a><span class='hs-comment'>--</span>
<a name="line-9"></a><span class='hs-comment'>-- Character encodings</span>
<a name="line-10"></a><span class='hs-comment'>--</span>
<a name="line-11"></a><span class='hs-comment'>-- -----------------------------------------------------------------------------</span>
<a name="line-12"></a>
<a name="line-13"></a><span class='hs-keyword'>module</span> <span class='hs-conid'>Encoding</span> <span class='hs-layout'>(</span>
<a name="line-14"></a>        <span class='hs-comment'>-- * UTF-8</span>
<a name="line-15"></a>        <span class='hs-varid'>utf8DecodeChar</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span>
<a name="line-16"></a>        <span class='hs-varid'>utf8PrevChar</span><span class='hs-layout'>,</span>
<a name="line-17"></a>        <span class='hs-varid'>utf8CharStart</span><span class='hs-layout'>,</span>
<a name="line-18"></a>        <span class='hs-varid'>utf8DecodeChar</span><span class='hs-layout'>,</span>
<a name="line-19"></a>        <span class='hs-varid'>utf8DecodeString</span><span class='hs-layout'>,</span>
<a name="line-20"></a>        <span class='hs-varid'>utf8EncodeChar</span><span class='hs-layout'>,</span>
<a name="line-21"></a>        <span class='hs-varid'>utf8EncodeString</span><span class='hs-layout'>,</span>
<a name="line-22"></a>        <span class='hs-varid'>utf8EncodedLength</span><span class='hs-layout'>,</span>
<a name="line-23"></a>        <span class='hs-varid'>countUTF8Chars</span><span class='hs-layout'>,</span>
<a name="line-24"></a>
<a name="line-25"></a>        <span class='hs-comment'>-- * Z-encoding</span>
<a name="line-26"></a>        <span class='hs-varid'>zEncodeString</span><span class='hs-layout'>,</span>
<a name="line-27"></a>        <span class='hs-varid'>zDecodeString</span>
<a name="line-28"></a>  <span class='hs-layout'>)</span> <span class='hs-keyword'>where</span>
<a name="line-29"></a>
<a name="line-30"></a><span class='hs-cpp'>#include "HsVersions.h"</span>
<a name="line-31"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Foreign</span>
<a name="line-32"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Data</span><span class='hs-varop'>.</span><span class='hs-conid'>Char</span>
<a name="line-33"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Numeric</span>
<a name="line-34"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>GHC</span><span class='hs-varop'>.</span><span class='hs-conid'>Ptr</span>          <span class='hs-layout'>(</span> <span class='hs-conid'>Ptr</span><span class='hs-layout'>(</span><span class='hs-keyglyph'>..</span><span class='hs-layout'>)</span> <span class='hs-layout'>)</span>
<a name="line-35"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>GHC</span><span class='hs-varop'>.</span><span class='hs-conid'>Base</span>
<a name="line-36"></a>
<a name="line-37"></a><span class='hs-comment'>-- -----------------------------------------------------------------------------</span>
<a name="line-38"></a><span class='hs-comment'>-- UTF-8</span>
<a name="line-39"></a>
<a name="line-40"></a><span class='hs-comment'>-- We can't write the decoder as efficiently as we'd like without</span>
<a name="line-41"></a><span class='hs-comment'>-- resorting to unboxed extensions, unfortunately.  I tried to write</span>
<a name="line-42"></a><span class='hs-comment'>-- an IO version of this function, but GHC can't eliminate boxed</span>
<a name="line-43"></a><span class='hs-comment'>-- results from an IO-returning function.</span>
<a name="line-44"></a><span class='hs-comment'>--</span>
<a name="line-45"></a><span class='hs-comment'>-- We assume we can ignore overflow when parsing a multibyte character here.</span>
<a name="line-46"></a><span class='hs-comment'>-- To make this safe, we add extra sentinel bytes to unparsed UTF-8 sequences</span>
<a name="line-47"></a><span class='hs-comment'>-- before decoding them (see StringBuffer.hs).</span>
<a name="line-48"></a>
<a name="line-49"></a><a name="utf8DecodeChar"></a><span class='hs-comment'>{-# INLINE utf8DecodeChar# #-}</span>
<a name="line-50"></a><span class='hs-definition'>utf8DecodeChar</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Addr</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-conid'>Char</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <span class='hs-conid'>Addr</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span>
<a name="line-51"></a><span class='hs-definition'>utf8DecodeChar</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>=</span>
<a name="line-52"></a>  <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch0</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>0</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span>
<a name="line-53"></a>  <span class='hs-keyword'>case</span> <span class='hs-conid'>()</span> <span class='hs-keyword'>of</span>
<a name="line-54"></a>    <span class='hs-keyword'>_</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&lt;=#</span> <span class='hs-num'>0x7F</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>chr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>ch0</span><span class='hs-layout'>,</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span>
<a name="line-55"></a>
<a name="line-56"></a>      <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&gt;=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&lt;=#</span> <span class='hs-num'>0xDF</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>-&gt;</span>
<a name="line-57"></a>        <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch1</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span>
<a name="line-58"></a>        <span class='hs-keyword'>if</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>&gt;=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span>
<a name="line-59"></a>        <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>chr</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch0</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>6</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>+#</span>
<a name="line-60"></a>                  <span class='hs-layout'>(</span><span class='hs-varid'>ch1</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span>
<a name="line-61"></a>           <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>2</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span>
<a name="line-62"></a>
<a name="line-63"></a>      <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&gt;=#</span> <span class='hs-num'>0xE0</span><span class='hs-cpp'>#</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&lt;=#</span> <span class='hs-num'>0xEF</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>-&gt;</span>
<a name="line-64"></a>        <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch1</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span>
<a name="line-65"></a>        <span class='hs-keyword'>if</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>&gt;=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span>
<a name="line-66"></a>        <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch2</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>2</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span>
<a name="line-67"></a>        <span class='hs-keyword'>if</span> <span class='hs-varid'>ch2</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch2</span> <span class='hs-varop'>&gt;=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>2</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span>
<a name="line-68"></a>        <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>chr</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch0</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0xE0</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>12</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>+#</span>
<a name="line-69"></a>                 <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch1</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>6</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span>  <span class='hs-varop'>+#</span>
<a name="line-70"></a>                  <span class='hs-layout'>(</span><span class='hs-varid'>ch2</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span>
<a name="line-71"></a>           <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>3</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span>
<a name="line-72"></a>
<a name="line-73"></a>     <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&gt;=#</span> <span class='hs-num'>0xF0</span><span class='hs-cpp'>#</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&lt;=#</span> <span class='hs-num'>0xF8</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>-&gt;</span>
<a name="line-74"></a>        <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch1</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span>
<a name="line-75"></a>        <span class='hs-keyword'>if</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>&gt;=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span>
<a name="line-76"></a>        <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch2</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>2</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span>
<a name="line-77"></a>        <span class='hs-keyword'>if</span> <span class='hs-varid'>ch2</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch2</span> <span class='hs-varop'>&gt;=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>2</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span>
<a name="line-78"></a>        <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch3</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>3</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span>
<a name="line-79"></a>        <span class='hs-keyword'>if</span> <span class='hs-varid'>ch3</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch3</span> <span class='hs-varop'>&gt;=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>3</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span>
<a name="line-80"></a>        <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>chr</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch0</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0xF0</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>18</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>+#</span>
<a name="line-81"></a>                 <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch1</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>12</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>+#</span>
<a name="line-82"></a>                 <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch2</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>6</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span>  <span class='hs-varop'>+#</span>
<a name="line-83"></a>                  <span class='hs-layout'>(</span><span class='hs-varid'>ch3</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span>
<a name="line-84"></a>           <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>4</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span>
<a name="line-85"></a>
<a name="line-86"></a>      <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-varid'>fail</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span>
<a name="line-87"></a>  <span class='hs-keyword'>where</span>
<a name="line-88"></a>        <span class='hs-comment'>-- all invalid sequences end up here:</span>
<a name="line-89"></a>        <span class='hs-varid'>fail</span> <span class='hs-varid'>n</span> <span class='hs-keyglyph'>=</span> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-chr'>'\0'</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-varid'>n</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span>
<a name="line-90"></a>        <span class='hs-comment'>-- '\xFFFD' would be the usual replacement character, but</span>
<a name="line-91"></a>        <span class='hs-comment'>-- that's a valid symbol in Haskell, so will result in a</span>
<a name="line-92"></a>        <span class='hs-comment'>-- confusing parse error later on.  Instead we use '\0' which</span>
<a name="line-93"></a>        <span class='hs-comment'>-- will signal a lexer error immediately.</span>
<a name="line-94"></a>
<a name="line-95"></a><span class='hs-definition'>utf8DecodeChar</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-layout'>(</span><span class='hs-conid'>Char</span><span class='hs-layout'>,</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span><span class='hs-layout'>)</span>
<a name="line-96"></a><span class='hs-definition'>utf8DecodeChar</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span>
<a name="line-97"></a>  <span class='hs-keyword'>case</span> <span class='hs-varid'>utf8DecodeChar</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>of</span> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>c</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <span class='hs-varid'>b</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-layout'>(</span> <span class='hs-conid'>C</span><span class='hs-cpp'>#</span> <span class='hs-varid'>c</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <span class='hs-conid'>Ptr</span> <span class='hs-varid'>b</span><span class='hs-cpp'>#</span> <span class='hs-layout'>)</span>
<a name="line-98"></a>
<a name="line-99"></a><a name="utf8PrevChar"></a><span class='hs-comment'>-- UTF-8 is cleverly designed so that we can always figure out where</span>
<a name="line-100"></a><span class='hs-comment'>-- the start of the current character is, given any position in a</span>
<a name="line-101"></a><span class='hs-comment'>-- stream.  This function finds the start of the previous character,</span>
<a name="line-102"></a><span class='hs-comment'>-- assuming there *is* a previous character.</span>
<a name="line-103"></a><span class='hs-definition'>utf8PrevChar</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>IO</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span><span class='hs-layout'>)</span>
<a name="line-104"></a><span class='hs-definition'>utf8PrevChar</span> <span class='hs-varid'>p</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>utf8CharStart</span> <span class='hs-layout'>(</span><span class='hs-varid'>p</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-layout'>(</span><span class='hs-varop'>-</span><span class='hs-num'>1</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-105"></a>
<a name="line-106"></a><a name="utf8CharStart"></a><span class='hs-definition'>utf8CharStart</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>IO</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span><span class='hs-layout'>)</span>
<a name="line-107"></a><span class='hs-definition'>utf8CharStart</span> <span class='hs-varid'>p</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-varid'>p</span>
<a name="line-108"></a> <span class='hs-keyword'>where</span> <span class='hs-varid'>go</span> <span class='hs-varid'>p</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>do</span> <span class='hs-varid'>w</span> <span class='hs-keyglyph'>&lt;-</span> <span class='hs-varid'>peek</span> <span class='hs-varid'>p</span>
<a name="line-109"></a>                 <span class='hs-keyword'>if</span> <span class='hs-varid'>w</span> <span class='hs-varop'>&gt;=</span> <span class='hs-num'>0x80</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>w</span> <span class='hs-varop'>&lt;</span> <span class='hs-num'>0xC0</span>
<a name="line-110"></a>                        <span class='hs-keyword'>then</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>p</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-layout'>(</span><span class='hs-varop'>-</span><span class='hs-num'>1</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-111"></a>                        <span class='hs-keyword'>else</span> <span class='hs-varid'>return</span> <span class='hs-varid'>p</span>
<a name="line-112"></a>
<a name="line-113"></a><a name="utf8DecodeString"></a><span class='hs-definition'>utf8DecodeString</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Int</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>IO</span> <span class='hs-keyglyph'>[</span><span class='hs-conid'>Char</span><span class='hs-keyglyph'>]</span>
<a name="line-114"></a><span class='hs-conid'>STRICT2</span><span class='hs-layout'>(</span><span class='hs-varid'>utf8DecodeString</span><span class='hs-layout'>)</span>
<a name="line-115"></a><span class='hs-definition'>utf8DecodeString</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-layout'>(</span><span class='hs-conid'>I</span><span class='hs-cpp'>#</span> <span class='hs-varid'>len</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span>
<a name="line-116"></a>  <span class='hs-keyglyph'>=</span> <span class='hs-varid'>unpack</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span>
<a name="line-117"></a>  <span class='hs-keyword'>where</span>
<a name="line-118"></a>    <span class='hs-varop'>!</span><span class='hs-varid'>end</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>addr2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-varid'>len</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span>
<a name="line-119"></a>
<a name="line-120"></a>    <span class='hs-varid'>unpack</span> <span class='hs-varid'>p</span><span class='hs-cpp'>#</span>
<a name="line-121"></a>        <span class='hs-keyglyph'>|</span> <span class='hs-varid'>addr2Int</span><span class='hs-cpp'>#</span> <span class='hs-varid'>p</span><span class='hs-cpp'>#</span> <span class='hs-varop'>&gt;=#</span> <span class='hs-varid'>end</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>return</span> <span class='hs-conid'>[]</span>
<a name="line-122"></a>        <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span>  <span class='hs-keyglyph'>=</span>
<a name="line-123"></a>        <span class='hs-keyword'>case</span> <span class='hs-varid'>utf8DecodeChar</span><span class='hs-cpp'>#</span> <span class='hs-varid'>p</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>of</span>
<a name="line-124"></a>           <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>c</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <span class='hs-varid'>q</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-keyword'>do</span>
<a name="line-125"></a>                <span class='hs-varid'>chs</span> <span class='hs-keyglyph'>&lt;-</span> <span class='hs-varid'>unpack</span> <span class='hs-varid'>q</span><span class='hs-cpp'>#</span>
<a name="line-126"></a>                <span class='hs-varid'>return</span> <span class='hs-layout'>(</span><span class='hs-conid'>C</span><span class='hs-cpp'>#</span> <span class='hs-varid'>c</span><span class='hs-cpp'>#</span> <span class='hs-conop'>:</span> <span class='hs-varid'>chs</span><span class='hs-layout'>)</span>
<a name="line-127"></a>
<a name="line-128"></a><a name="countUTF8Chars"></a><span class='hs-definition'>countUTF8Chars</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Int</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>IO</span> <span class='hs-conid'>Int</span>
<a name="line-129"></a><span class='hs-definition'>countUTF8Chars</span> <span class='hs-varid'>ptr</span> <span class='hs-varid'>bytes</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>0</span>
<a name="line-130"></a>  <span class='hs-keyword'>where</span>
<a name="line-131"></a>        <span class='hs-varid'>end</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>ptr</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-varid'>bytes</span>
<a name="line-132"></a>
<a name="line-133"></a>        <span class='hs-conid'>STRICT2</span><span class='hs-layout'>(</span><span class='hs-varid'>go</span><span class='hs-layout'>)</span>
<a name="line-134"></a>        <span class='hs-varid'>go</span> <span class='hs-varid'>ptr</span> <span class='hs-varid'>n</span>
<a name="line-135"></a>           <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ptr</span> <span class='hs-varop'>&gt;=</span> <span class='hs-varid'>end</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>return</span> <span class='hs-varid'>n</span>
<a name="line-136"></a>           <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span>  <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>do</span>
<a name="line-137"></a>                <span class='hs-keyword'>case</span> <span class='hs-varid'>utf8DecodeChar</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>unPtr</span> <span class='hs-varid'>ptr</span><span class='hs-layout'>)</span> <span class='hs-keyword'>of</span>
<a name="line-138"></a>                  <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>_</span><span class='hs-layout'>,</span> <span class='hs-varid'>a</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-varid'>a</span><span class='hs-layout'>)</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>1</span><span class='hs-layout'>)</span>
<a name="line-139"></a>
<a name="line-140"></a><a name="unPtr"></a><span class='hs-definition'>unPtr</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-varid'>a</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Addr</span><span class='hs-cpp'>#</span>
<a name="line-141"></a><span class='hs-definition'>unPtr</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-varid'>a</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>a</span>
<a name="line-142"></a>
<a name="line-143"></a><a name="utf8EncodeChar"></a><span class='hs-definition'>utf8EncodeChar</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>IO</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span><span class='hs-layout'>)</span>
<a name="line-144"></a><span class='hs-definition'>utf8EncodeChar</span> <span class='hs-varid'>c</span> <span class='hs-varid'>ptr</span> <span class='hs-keyglyph'>=</span>
<a name="line-145"></a>  <span class='hs-keyword'>let</span> <span class='hs-varid'>x</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>ord</span> <span class='hs-varid'>c</span> <span class='hs-keyword'>in</span>
<a name="line-146"></a>  <span class='hs-keyword'>case</span> <span class='hs-conid'>()</span> <span class='hs-keyword'>of</span>
<a name="line-147"></a>    <span class='hs-keyword'>_</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>x</span> <span class='hs-varop'>&gt;</span> <span class='hs-num'>0</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>x</span> <span class='hs-varop'>&lt;=</span> <span class='hs-num'>0x007f</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-keyword'>do</span>
<a name="line-148"></a>          <span class='hs-varid'>poke</span> <span class='hs-varid'>ptr</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-varid'>x</span><span class='hs-layout'>)</span>
<a name="line-149"></a>          <span class='hs-varid'>return</span> <span class='hs-layout'>(</span><span class='hs-varid'>ptr</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-num'>1</span><span class='hs-layout'>)</span>
<a name="line-150"></a>        <span class='hs-comment'>-- NB. '\0' is encoded as '\xC0\x80', not '\0'.  This is so that we</span>
<a name="line-151"></a>        <span class='hs-comment'>-- can have 0-terminated UTF-8 strings (see GHC.Base.unpackCStringUtf8).</span>
<a name="line-152"></a>      <span class='hs-keyglyph'>|</span> <span class='hs-varid'>x</span> <span class='hs-varop'>&lt;=</span> <span class='hs-num'>0x07ff</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-keyword'>do</span>
<a name="line-153"></a>          <span class='hs-varid'>poke</span> <span class='hs-varid'>ptr</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0xC0</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>6</span><span class='hs-layout'>)</span> <span class='hs-varop'>.&amp;.</span> <span class='hs-num'>0x1F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-154"></a>          <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>1</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>.&amp;.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-155"></a>          <span class='hs-varid'>return</span> <span class='hs-layout'>(</span><span class='hs-varid'>ptr</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-num'>2</span><span class='hs-layout'>)</span>
<a name="line-156"></a>      <span class='hs-keyglyph'>|</span> <span class='hs-varid'>x</span> <span class='hs-varop'>&lt;=</span> <span class='hs-num'>0xffff</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-keyword'>do</span>
<a name="line-157"></a>          <span class='hs-varid'>poke</span> <span class='hs-varid'>ptr</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0xE0</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>12</span><span class='hs-layout'>)</span> <span class='hs-varop'>.&amp;.</span> <span class='hs-num'>0x0F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-158"></a>          <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>1</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>6</span><span class='hs-layout'>)</span> <span class='hs-varop'>.&amp;.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-159"></a>          <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>2</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>.&amp;.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-160"></a>          <span class='hs-varid'>return</span> <span class='hs-layout'>(</span><span class='hs-varid'>ptr</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-num'>3</span><span class='hs-layout'>)</span>
<a name="line-161"></a>      <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-keyword'>do</span>
<a name="line-162"></a>          <span class='hs-varid'>poke</span> <span class='hs-varid'>ptr</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0xF0</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>18</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-163"></a>          <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>1</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>12</span><span class='hs-layout'>)</span> <span class='hs-varop'>.&amp;.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-164"></a>          <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>2</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>6</span><span class='hs-layout'>)</span> <span class='hs-varop'>.&amp;.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-165"></a>          <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>3</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>.&amp;.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span>
<a name="line-166"></a>          <span class='hs-varid'>return</span> <span class='hs-layout'>(</span><span class='hs-varid'>ptr</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-num'>4</span><span class='hs-layout'>)</span>
<a name="line-167"></a>
<a name="line-168"></a><a name="utf8EncodeString"></a><span class='hs-definition'>utf8EncodeString</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>String</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>IO</span> <span class='hs-conid'>()</span>
<a name="line-169"></a><span class='hs-definition'>utf8EncodeString</span> <span class='hs-varid'>ptr</span> <span class='hs-varid'>str</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-varid'>ptr</span> <span class='hs-varid'>str</span>
<a name="line-170"></a>  <span class='hs-keyword'>where</span> <span class='hs-conid'>STRICT2</span><span class='hs-layout'>(</span><span class='hs-varid'>go</span><span class='hs-layout'>)</span>
<a name="line-171"></a>        <span class='hs-varid'>go</span> <span class='hs-keyword'>_</span>   <span class='hs-conid'>[]</span>     <span class='hs-keyglyph'>=</span> <span class='hs-varid'>return</span> <span class='hs-conid'>()</span>
<a name="line-172"></a>        <span class='hs-varid'>go</span> <span class='hs-varid'>ptr</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span><span class='hs-conop'>:</span><span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>do</span>
<a name="line-173"></a>          <span class='hs-varid'>ptr'</span> <span class='hs-keyglyph'>&lt;-</span> <span class='hs-varid'>utf8EncodeChar</span> <span class='hs-varid'>c</span> <span class='hs-varid'>ptr</span>
<a name="line-174"></a>          <span class='hs-varid'>go</span> <span class='hs-varid'>ptr'</span> <span class='hs-varid'>cs</span>
<a name="line-175"></a>
<a name="line-176"></a><a name="utf8EncodedLength"></a><span class='hs-definition'>utf8EncodedLength</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>String</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Int</span>
<a name="line-177"></a><span class='hs-definition'>utf8EncodedLength</span> <span class='hs-varid'>str</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-num'>0</span> <span class='hs-varid'>str</span>
<a name="line-178"></a>  <span class='hs-keyword'>where</span> <span class='hs-conid'>STRICT2</span><span class='hs-layout'>(</span><span class='hs-varid'>go</span><span class='hs-layout'>)</span>
<a name="line-179"></a>        <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-conid'>[]</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>n</span>
<a name="line-180"></a>        <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span><span class='hs-conop'>:</span><span class='hs-varid'>cs</span><span class='hs-layout'>)</span>
<a name="line-181"></a>          <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ord</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&gt;</span> <span class='hs-num'>0</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>ord</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&lt;=</span> <span class='hs-num'>0x007f</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span>
<a name="line-182"></a>          <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ord</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&lt;=</span> <span class='hs-num'>0x07ff</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>2</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span>
<a name="line-183"></a>          <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ord</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&lt;=</span> <span class='hs-num'>0xffff</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>3</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span>
<a name="line-184"></a>          <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span>       <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>4</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span>
<a name="line-185"></a>
<a name="line-186"></a><span class='hs-comment'>-- -----------------------------------------------------------------------------</span>
<a name="line-187"></a><span class='hs-comment'>-- The Z-encoding</span>
<a name="line-188"></a>
<a name="line-189"></a><span class='hs-comment'>{-
<a name="line-190"></a>This is the main name-encoding and decoding function.  It encodes any
<a name="line-191"></a>string into a string that is acceptable as a C name.  This is done
<a name="line-192"></a>right before we emit a symbol name into the compiled C or asm code.
<a name="line-193"></a>Z-encoding of strings is cached in the FastString interface, so we
<a name="line-194"></a>never encode the same string more than once.
<a name="line-195"></a>
<a name="line-196"></a>The basic encoding scheme is this.
<a name="line-197"></a>
<a name="line-198"></a>* Tuples (,,) are coded as Z3T
<a name="line-199"></a>
<a name="line-200"></a>* Alphabetic characters (upper and lower) and digits
<a name="line-201"></a>        all translate to themselves;
<a name="line-202"></a>        except 'Z', which translates to 'ZZ'
<a name="line-203"></a>        and    'z', which translates to 'zz'
<a name="line-204"></a>  We need both so that we can preserve the variable/tycon distinction
<a name="line-205"></a>
<a name="line-206"></a>* Most other printable characters translate to 'zx' or 'Zx' for some
<a name="line-207"></a>        alphabetic character x
<a name="line-208"></a>
<a name="line-209"></a>* The others translate as 'znnnU' where 'nnn' is the hexadecimal code
<a name="line-210"></a>        of the character, prefixed with '0' if it would start with a letter
<a name="line-211"></a>
<a name="line-212"></a>        Before          After
<a name="line-213"></a>        --------------------------
<a name="line-214"></a>        Trak            Trak
<a name="line-215"></a>        foo_wib         foozuwib
<a name="line-216"></a>        &gt;               zg
<a name="line-217"></a>        &gt;1              zg1
<a name="line-218"></a>        foo#            foozh
<a name="line-219"></a>        foo##           foozhzh
<a name="line-220"></a>        foo##1          foozhzh1
<a name="line-221"></a>        fooZ            fooZZ
<a name="line-222"></a>        :+              ZCzp
<a name="line-223"></a>        ()              Z0T     0-tuple
<a name="line-224"></a>        (,,,,)          Z5T     5-tuple
<a name="line-225"></a>        (# #)           Z1H     unboxed 1-tuple (note the space)
<a name="line-226"></a>        (#,,,,#)        Z5H     unboxed 5-tuple
<a name="line-227"></a>                (NB: There is no Z1T nor Z0H.)
<a name="line-228"></a>-}</span>
<a name="line-229"></a>
<a name="line-230"></a><a name="UserString"></a><span class='hs-keyword'>type</span> <span class='hs-conid'>UserString</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>String</span>        <span class='hs-comment'>-- As the user typed it</span>
<a name="line-231"></a><a name="EncodedString"></a><span class='hs-keyword'>type</span> <span class='hs-conid'>EncodedString</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>String</span>     <span class='hs-comment'>-- Encoded form</span>
<a name="line-232"></a>
<a name="line-233"></a>
<a name="line-234"></a><a name="zEncodeString"></a><span class='hs-definition'>zEncodeString</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>UserString</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>EncodedString</span>
<a name="line-235"></a><span class='hs-definition'>zEncodeString</span> <span class='hs-varid'>cs</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>case</span> <span class='hs-varid'>maybe_tuple</span> <span class='hs-varid'>cs</span> <span class='hs-keyword'>of</span>
<a name="line-236"></a>                <span class='hs-conid'>Just</span> <span class='hs-varid'>n</span>  <span class='hs-keyglyph'>-&gt;</span> <span class='hs-varid'>n</span>            <span class='hs-comment'>-- Tuples go to Z2T etc</span>
<a name="line-237"></a>                <span class='hs-conid'>Nothing</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-varid'>go</span> <span class='hs-varid'>cs</span>
<a name="line-238"></a>          <span class='hs-keyword'>where</span>
<a name="line-239"></a>                <span class='hs-varid'>go</span> <span class='hs-conid'>[]</span>     <span class='hs-keyglyph'>=</span> <span class='hs-conid'>[]</span>
<a name="line-240"></a>                <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span><span class='hs-conop'>:</span><span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>encode_digit_ch</span> <span class='hs-varid'>c</span> <span class='hs-varop'>++</span> <span class='hs-varid'>go'</span> <span class='hs-varid'>cs</span>
<a name="line-241"></a>                <span class='hs-varid'>go'</span> <span class='hs-conid'>[]</span>     <span class='hs-keyglyph'>=</span> <span class='hs-conid'>[]</span>
<a name="line-242"></a>                <span class='hs-varid'>go'</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span><span class='hs-conop'>:</span><span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>encode_ch</span> <span class='hs-varid'>c</span> <span class='hs-varop'>++</span> <span class='hs-varid'>go'</span> <span class='hs-varid'>cs</span>
<a name="line-243"></a>
<a name="line-244"></a><a name="unencodedChar"></a><span class='hs-definition'>unencodedChar</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Bool</span>   <span class='hs-comment'>-- True for chars that don't need encoding</span>
<a name="line-245"></a><span class='hs-definition'>unencodedChar</span> <span class='hs-chr'>'Z'</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>False</span>
<a name="line-246"></a><span class='hs-definition'>unencodedChar</span> <span class='hs-chr'>'z'</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>False</span>
<a name="line-247"></a><span class='hs-definition'>unencodedChar</span> <span class='hs-varid'>c</span>   <span class='hs-keyglyph'>=</span>  <span class='hs-varid'>c</span> <span class='hs-varop'>&gt;=</span> <span class='hs-chr'>'a'</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&lt;=</span> <span class='hs-chr'>'z'</span>
<a name="line-248"></a>                  <span class='hs-varop'>||</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&gt;=</span> <span class='hs-chr'>'A'</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&lt;=</span> <span class='hs-chr'>'Z'</span>
<a name="line-249"></a>                  <span class='hs-varop'>||</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&gt;=</span> <span class='hs-chr'>'0'</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&lt;=</span> <span class='hs-chr'>'9'</span>
<a name="line-250"></a>
<a name="line-251"></a><a name="encode_digit_ch"></a><span class='hs-comment'>-- If a digit is at the start of a symbol then we need to encode it.</span>
<a name="line-252"></a><span class='hs-comment'>-- Otherwise package names like 9pH-0.1 give linker errors.</span>
<a name="line-253"></a><span class='hs-definition'>encode_digit_ch</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>EncodedString</span>
<a name="line-254"></a><span class='hs-definition'>encode_digit_ch</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&gt;=</span> <span class='hs-chr'>'0'</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>c</span> <span class='hs-varop'>&lt;=</span> <span class='hs-chr'>'9'</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>encode_as_unicode_char</span> <span class='hs-varid'>c</span>
<a name="line-255"></a><span class='hs-definition'>encode_digit_ch</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span>            <span class='hs-keyglyph'>=</span> <span class='hs-varid'>encode_ch</span> <span class='hs-varid'>c</span>
<a name="line-256"></a>
<a name="line-257"></a><a name="encode_ch"></a><span class='hs-definition'>encode_ch</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>EncodedString</span>
<a name="line-258"></a><span class='hs-definition'>encode_ch</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>unencodedChar</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyglyph'>[</span><span class='hs-varid'>c</span><span class='hs-keyglyph'>]</span>     <span class='hs-comment'>-- Common case first</span>
<a name="line-259"></a>
<a name="line-260"></a><span class='hs-comment'>-- Constructors</span>
<a name="line-261"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'('</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZL"</span>   <span class='hs-comment'>-- Needed for things like (,), and (-&gt;)</span>
<a name="line-262"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>')'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZR"</span>   <span class='hs-comment'>-- For symmetry with (</span>
<a name="line-263"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'['</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZM"</span>
<a name="line-264"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>']'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZN"</span>
<a name="line-265"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>':'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZC"</span>
<a name="line-266"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'Z'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZZ"</span>
<a name="line-267"></a>
<a name="line-268"></a><span class='hs-comment'>-- Variables</span>
<a name="line-269"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'z'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zz"</span>
<a name="line-270"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'&amp;'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"za"</span>
<a name="line-271"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'|'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zb"</span>
<a name="line-272"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'^'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zc"</span>
<a name="line-273"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'$'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zd"</span>
<a name="line-274"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'='</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ze"</span>
<a name="line-275"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'&gt;'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zg"</span>
<a name="line-276"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'#'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zh"</span>
<a name="line-277"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'.'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zi"</span>
<a name="line-278"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'&lt;'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zl"</span>
<a name="line-279"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'-'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zm"</span>
<a name="line-280"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'!'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zn"</span>
<a name="line-281"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'+'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zp"</span>
<a name="line-282"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'\''</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zq"</span>
<a name="line-283"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'\\'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zr"</span>
<a name="line-284"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'/'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zs"</span>
<a name="line-285"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'*'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zt"</span>
<a name="line-286"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'_'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zu"</span>
<a name="line-287"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'%'</span>  <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zv"</span>
<a name="line-288"></a><span class='hs-definition'>encode_ch</span> <span class='hs-varid'>c</span>    <span class='hs-keyglyph'>=</span> <span class='hs-varid'>encode_as_unicode_char</span> <span class='hs-varid'>c</span>
<a name="line-289"></a>
<a name="line-290"></a><a name="encode_as_unicode_char"></a><span class='hs-definition'>encode_as_unicode_char</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>EncodedString</span>
<a name="line-291"></a><span class='hs-definition'>encode_as_unicode_char</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'z'</span> <span class='hs-conop'>:</span> <span class='hs-keyword'>if</span> <span class='hs-varid'>isDigit</span> <span class='hs-layout'>(</span><span class='hs-varid'>head</span> <span class='hs-varid'>hex_str</span><span class='hs-layout'>)</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>hex_str</span>
<a name="line-292"></a>                                                           <span class='hs-keyword'>else</span> <span class='hs-chr'>'0'</span><span class='hs-conop'>:</span><span class='hs-varid'>hex_str</span>
<a name="line-293"></a>  <span class='hs-keyword'>where</span> <span class='hs-varid'>hex_str</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>showHex</span> <span class='hs-layout'>(</span><span class='hs-varid'>ord</span> <span class='hs-varid'>c</span><span class='hs-layout'>)</span> <span class='hs-str'>"U"</span>
<a name="line-294"></a>  <span class='hs-comment'>-- ToDo: we could improve the encoding here in various ways.</span>
<a name="line-295"></a>  <span class='hs-comment'>-- eg. strings of unicode characters come out as 'z1234Uz5678U', we</span>
<a name="line-296"></a>  <span class='hs-comment'>-- could remove the 'U' in the middle (the 'z' works as a separator).</span>
<a name="line-297"></a>
<!--
  zDecodeString (rendered Haskell source): turns an EncodedString back into
  a UserString.
    * empty input gives empty output;
    * 'Z' followed by a digit is handed to decode_tuple, which consumes the
      rest of the input itself;
    * 'Z' followed by any other character is mapped through decode_upper and
      decoding continues with the remainder;
    * 'z' followed by a digit is handed to decode_num_esc;
    * 'z' followed by any other character is mapped through decode_lower;
    * every other character is copied through unchanged.  A 'Z' or 'z' that
      is the very last character also reaches this final equation, because
      the escape patterns need at least one following character.
--><a name="line-298"></a><a name="zDecodeString"></a><span class='hs-definition'>zDecodeString</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>EncodedString</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>UserString</span>
<a name="line-299"></a><span class='hs-definition'>zDecodeString</span> <span class='hs-conid'>[]</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>[]</span>
<a name="line-300"></a><span class='hs-definition'>zDecodeString</span> <span class='hs-layout'>(</span><span class='hs-chr'>'Z'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>d</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span>
<a name="line-301"></a>  <span class='hs-keyglyph'>|</span> <span class='hs-varid'>isDigit</span> <span class='hs-varid'>d</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>decode_tuple</span>   <span class='hs-varid'>d</span> <span class='hs-varid'>rest</span>
<a name="line-302"></a>  <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>decode_upper</span>   <span class='hs-varid'>d</span> <span class='hs-conop'>:</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span>
<a name="line-303"></a><span class='hs-definition'>zDecodeString</span> <span class='hs-layout'>(</span><span class='hs-chr'>'z'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>d</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span>
<a name="line-304"></a>  <span class='hs-keyglyph'>|</span> <span class='hs-varid'>isDigit</span> <span class='hs-varid'>d</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>decode_num_esc</span> <span class='hs-varid'>d</span> <span class='hs-varid'>rest</span>
<a name="line-305"></a>  <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>decode_lower</span>   <span class='hs-varid'>d</span> <span class='hs-conop'>:</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span>
<a name="line-306"></a><span class='hs-definition'>zDecodeString</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span>   <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>c</span> <span class='hs-conop'>:</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span>
<a name="line-307"></a>
<!--
  decode_upper (rendered Haskell source): maps the character that follows an
  uppercase 'Z' escape back to the character it stands for:
    L gives (    R gives )    M gives [    N gives ]    C gives :    Z gives Z
  Any other character is returned unchanged; the pprTrace call in the final
  equation is commented out, so no diagnostic is produced.
  The type signature on the first line is shared with decode_lower.
--><a name="line-308"></a><a name="decode_upper"></a><span class='hs-definition'>decode_upper</span><span class='hs-layout'>,</span> <span class='hs-varid'>decode_lower</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Char</span>
<a name="line-309"></a>
<a name="line-310"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'L'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'('</span>
<a name="line-311"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'R'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>')'</span>
<a name="line-312"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'M'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'['</span>
<a name="line-313"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'N'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>']'</span>
<a name="line-314"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'C'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>':'</span>
<a name="line-315"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'Z'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'Z'</span>
<a name="line-316"></a><span class='hs-definition'>decode_upper</span> <span class='hs-varid'>ch</span>  <span class='hs-keyglyph'>=</span> <span class='hs-comment'>{-pprTrace "decode_upper" (char ch)-}</span> <span class='hs-varid'>ch</span>
<a name="line-317"></a>
<!--
  decode_lower (rendered Haskell source): maps the character that follows a
  lowercase 'z' escape back to the symbol it stands for, one equation per
  escape letter (for example 'a' gives the ampersand, 'u' gives the
  underscore, and 'z' gives a literal 'z').
  A character with no equation of its own is returned unchanged; the
  pprTrace call in the final equation is commented out.
  The type signature for this function is declared together with
  decode_upper.
--><a name="line-318"></a><a name="decode_lower"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'z'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'z'</span>
<a name="line-319"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'a'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'&amp;'</span>
<a name="line-320"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'b'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'|'</span>
<a name="line-321"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'c'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'^'</span>
<a name="line-322"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'d'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'$'</span>
<a name="line-323"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'e'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'='</span>
<a name="line-324"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'g'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'&gt;'</span>
<a name="line-325"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'h'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'#'</span>
<a name="line-326"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'i'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'.'</span>
<a name="line-327"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'l'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'&lt;'</span>
<a name="line-328"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'m'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'-'</span>
<a name="line-329"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'n'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'!'</span>
<a name="line-330"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'p'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'+'</span>
<a name="line-331"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'q'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'\''</span>
<a name="line-332"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'r'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'\\'</span>
<a name="line-333"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'s'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'/'</span>
<a name="line-334"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'t'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'*'</span>
<a name="line-335"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'u'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'_'</span>
<a name="line-336"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'v'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'%'</span>
<a name="line-337"></a><span class='hs-definition'>decode_lower</span> <span class='hs-varid'>ch</span>  <span class='hs-keyglyph'>=</span> <span class='hs-comment'>{-pprTrace "decode_lower" (char ch)-}</span> <span class='hs-varid'>ch</span>
<a name="line-338"></a>
<!--
  decode_num_esc (rendered Haskell source): decodes a numeric escape of the
  form z<hex digits>U.  The caller has already consumed the 'z' and passes
  the first digit as d.
    * the local go seeds its accumulator with digitToInt d and folds in each
      following hex digit as 16*n + digit;
    * on the terminating 'U' it emits chr n and resumes zDecodeString on the
      remaining input;
    * anything else, including running out of input before a 'U', reaches
      the last equation and calls error with the value accumulated so far
      and the unconsumed text.
--><a name="line-339"></a><a name="decode_num_esc"></a><span class='hs-comment'>-- Characters not having a specific code are coded as z224U (in hex)</span>
<a name="line-340"></a><span class='hs-definition'>decode_num_esc</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>EncodedString</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>UserString</span>
<a name="line-341"></a><span class='hs-definition'>decode_num_esc</span> <span class='hs-varid'>d</span> <span class='hs-varid'>rest</span>
<a name="line-342"></a>  <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>digitToInt</span> <span class='hs-varid'>d</span><span class='hs-layout'>)</span> <span class='hs-varid'>rest</span>
<a name="line-343"></a>  <span class='hs-keyword'>where</span>
<a name="line-344"></a>    <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>isHexDigit</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-num'>16</span><span class='hs-varop'>*</span><span class='hs-varid'>n</span> <span class='hs-varop'>+</span> <span class='hs-varid'>digitToInt</span> <span class='hs-varid'>c</span><span class='hs-layout'>)</span> <span class='hs-varid'>rest</span>
<a name="line-345"></a>    <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-chr'>'U'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span>           <span class='hs-keyglyph'>=</span> <span class='hs-varid'>chr</span> <span class='hs-varid'>n</span> <span class='hs-conop'>:</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span>
<a name="line-346"></a>    <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-varid'>other</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>error</span> <span class='hs-layout'>(</span><span class='hs-str'>"decode_num_esc: "</span> <span class='hs-varop'>++</span> <span class='hs-varid'>show</span> <span class='hs-varid'>n</span> <span class='hs-varop'>++</span>  <span class='hs-chr'>' '</span><span class='hs-conop'>:</span><span class='hs-varid'>other</span><span class='hs-layout'>)</span>
<a name="line-347"></a>
<!--
  decode_tuple (rendered Haskell source): decodes a tuple escape of the form
  Z<decimal digits>T (boxed) or Z<decimal digits>H (unboxed).  The caller has
  already consumed the 'Z' and passes the first digit as d.
    * the local go seeds its accumulator with digitToInt d and folds in each
      following decimal digit as 10*n + digit;
    * 0 followed by 'T' gives "()"; n followed by 'T' gives "(" plus n-1
      commas plus ")";
    * 1 followed by 'H' gives "(# #)"; n followed by 'H' gives "(#" plus n-1
      commas plus "#)";
    * after the tuple, decoding resumes with zDecodeString on the remainder;
    * any other continuation, including end of input, calls error with the
      value accumulated so far and the unconsumed text.
  Markup: the subtraction sign in (n-1) is an operator and carries the
  hs-varop class, like the other arithmetic operators on this page.
--><a name="line-348"></a><a name="decode_tuple"></a><span class='hs-definition'>decode_tuple</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>EncodedString</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>UserString</span>
<a name="line-349"></a><span class='hs-definition'>decode_tuple</span> <span class='hs-varid'>d</span> <span class='hs-varid'>rest</span>
<a name="line-350"></a>  <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>digitToInt</span> <span class='hs-varid'>d</span><span class='hs-layout'>)</span> <span class='hs-varid'>rest</span>
<a name="line-351"></a>  <span class='hs-keyword'>where</span>
<a name="line-352"></a>        <span class='hs-comment'>-- NB. recurse back to zDecodeString after decoding the tuple, because</span>
<a name="line-353"></a>        <span class='hs-comment'>-- the tuple might be embedded in a longer name.</span>
<a name="line-354"></a>    <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>isDigit</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-num'>10</span><span class='hs-varop'>*</span><span class='hs-varid'>n</span> <span class='hs-varop'>+</span> <span class='hs-varid'>digitToInt</span> <span class='hs-varid'>c</span><span class='hs-layout'>)</span> <span class='hs-varid'>rest</span>
<a name="line-355"></a>    <span class='hs-varid'>go</span> <span class='hs-num'>0</span> <span class='hs-layout'>(</span><span class='hs-chr'>'T'</span><span class='hs-conop'>:</span><span class='hs-varid'>rest</span><span class='hs-layout'>)</span>     <span class='hs-keyglyph'>=</span> <span class='hs-str'>"()"</span> <span class='hs-varop'>++</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span>
<a name="line-356"></a>    <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-chr'>'T'</span><span class='hs-conop'>:</span><span class='hs-varid'>rest</span><span class='hs-layout'>)</span>     <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'('</span> <span class='hs-conop'>:</span> <span class='hs-varid'>replicate</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>-</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-chr'>','</span> <span class='hs-varop'>++</span> <span class='hs-str'>")"</span> <span class='hs-varop'>++</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span>
<a name="line-357"></a>    <span class='hs-varid'>go</span> <span class='hs-num'>1</span> <span class='hs-layout'>(</span><span class='hs-chr'>'H'</span><span class='hs-conop'>:</span><span class='hs-varid'>rest</span><span class='hs-layout'>)</span>     <span class='hs-keyglyph'>=</span> <span class='hs-str'>"(# #)"</span> <span class='hs-varop'>++</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span>
<a name="line-358"></a>    <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-chr'>'H'</span><span class='hs-conop'>:</span><span class='hs-varid'>rest</span><span class='hs-layout'>)</span>     <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'('</span> <span class='hs-conop'>:</span> <span class='hs-chr'>'#'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>replicate</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>-</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-chr'>','</span> <span class='hs-varop'>++</span> <span class='hs-str'>"#)"</span> <span class='hs-varop'>++</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span>
<a name="line-359"></a>    <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-varid'>other</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>error</span> <span class='hs-layout'>(</span><span class='hs-str'>"decode_tuple: "</span> <span class='hs-varop'>++</span> <span class='hs-varid'>show</span> <span class='hs-varid'>n</span> <span class='hs-varop'>++</span> <span class='hs-chr'>' '</span><span class='hs-conop'>:</span><span class='hs-varid'>other</span><span class='hs-layout'>)</span>
<a name="line-360"></a>
<a name="line-361"></a><span class='hs-comment'>{-
<a name="line-362"></a>Tuples are encoded as
<a name="line-363"></a>        Z3T or Z3H
<a name="line-364"></a>for 3-tuples or unboxed 3-tuples respectively.  No other encoding starts
<a name="line-365"></a>        Z&lt;digit&gt;
<a name="line-366"></a>
<a name="line-367"></a>* "(# #)" is the tycon for an unboxed 1-tuple (not 0-tuple)
<a name="line-368"></a>  There are no unboxed 0-tuples.
<a name="line-369"></a>
<a name="line-370"></a>* "()" is the tycon for a boxed 0-tuple.
<a name="line-371"></a>  There are no boxed 1-tuples.
<a name="line-372"></a>-}</span>
<a name="line-373"></a>
<!--
  maybe_tuple (rendered Haskell source): recognises tuple type constructor
  names and returns their encoding, or Nothing for any other string.
    * "(# #)" gives Just "Z1H";
    * "(#" followed by n commas and then "#)" gives 'Z', the decimal n+1,
      and 'H';
    * "()" gives Just "Z0T";
    * "(" followed by n commas and then ")" gives 'Z', the decimal n+1,
      and 'T'.
  Equation order matters: the exact-string cases come before the more
  general prefix patterns.  In the comma-counting cases, whatever follows
  the closing bracket is matched by a wildcard and ignored.
--><a name="line-374"></a><a name="maybe_tuple"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>UserString</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Maybe</span> <span class='hs-conid'>EncodedString</span>
<a name="line-375"></a>
<a name="line-376"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-str'>"(# #)"</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>Just</span><span class='hs-layout'>(</span><span class='hs-str'>"Z1H"</span><span class='hs-layout'>)</span>
<a name="line-377"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-layout'>(</span><span class='hs-chr'>'('</span> <span class='hs-conop'>:</span> <span class='hs-chr'>'#'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>case</span> <span class='hs-varid'>count_commas</span> <span class='hs-layout'>(</span><span class='hs-num'>0</span><span class='hs-keyglyph'>::</span><span class='hs-conid'>Int</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span> <span class='hs-keyword'>of</span>
<a name="line-378"></a>                                 <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-layout'>,</span> <span class='hs-chr'>'#'</span> <span class='hs-conop'>:</span> <span class='hs-chr'>')'</span> <span class='hs-conop'>:</span> <span class='hs-keyword'>_</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Just</span> <span class='hs-layout'>(</span><span class='hs-chr'>'Z'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>shows</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-str'>"H"</span><span class='hs-layout'>)</span>
<a name="line-379"></a>                                 <span class='hs-keyword'>_</span>                  <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Nothing</span>
<a name="line-380"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-str'>"()"</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>Just</span><span class='hs-layout'>(</span><span class='hs-str'>"Z0T"</span><span class='hs-layout'>)</span>
<a name="line-381"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-layout'>(</span><span class='hs-chr'>'('</span> <span class='hs-conop'>:</span> <span class='hs-varid'>cs</span><span class='hs-layout'>)</span>       <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>case</span> <span class='hs-varid'>count_commas</span> <span class='hs-layout'>(</span><span class='hs-num'>0</span><span class='hs-keyglyph'>::</span><span class='hs-conid'>Int</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span> <span class='hs-keyword'>of</span>
<a name="line-382"></a>                                 <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-layout'>,</span> <span class='hs-chr'>')'</span> <span class='hs-conop'>:</span> <span class='hs-keyword'>_</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Just</span> <span class='hs-layout'>(</span><span class='hs-chr'>'Z'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>shows</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-str'>"T"</span><span class='hs-layout'>)</span>
<a name="line-383"></a>                                 <span class='hs-keyword'>_</span>            <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>Nothing</span>
<a name="line-384"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-keyword'>_</span>                <span class='hs-keyglyph'>=</span> <span class='hs-conid'>Nothing</span>
<a name="line-385"></a>
<!--
  count_commas (rendered Haskell source): strips leading commas from a
  string.  Each leading ',' adds one to the running count n; at the first
  character that is not a comma (or at end of input) it returns the final
  count paired with the unconsumed remainder.
--><a name="line-386"></a><a name="count_commas"></a><span class='hs-definition'>count_commas</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Int</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-conid'>String</span> <span class='hs-keyglyph'>-&gt;</span> <span class='hs-layout'>(</span><span class='hs-conid'>Int</span><span class='hs-layout'>,</span> <span class='hs-conid'>String</span><span class='hs-layout'>)</span>
<a name="line-387"></a><span class='hs-definition'>count_commas</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-chr'>','</span> <span class='hs-conop'>:</span> <span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>count_commas</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span>
<a name="line-388"></a><span class='hs-definition'>count_commas</span> <span class='hs-varid'>n</span> <span class='hs-varid'>cs</span>         <span class='hs-keyglyph'>=</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-layout'>,</span><span class='hs-varid'>cs</span><span class='hs-layout'>)</span>
</pre></body>
</html>