<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
  <!-- Generated by HsColour, http://www.cs.york.ac.uk/fp/darcs/hscolour/ -->
  <!-- The XHTML namespace on the root element is required by the Strict DTD named in the DOCTYPE. The meta element below repeats the UTF-8 encoding from the XML declaration for user agents that process this page as text/html and ignore that declaration. -->
  <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
  <title>utils/Encoding.hs</title>
  <link type='text/css' rel='stylesheet' href='hscolour.css' />
</head>
<body>
<pre><a name="line-1"></a><span class='hs-comment'>{-# OPTIONS_GHC -O #-}</span> <a name="line-2"></a><span class='hs-comment'>-- We always optimise this, otherwise performance of a non-optimised</span> <a name="line-3"></a><span class='hs-comment'>-- compiler is severely affected</span> <a name="line-4"></a> <a name="line-5"></a><span class='hs-comment'>-- -----------------------------------------------------------------------------</span> <a name="line-6"></a><span class='hs-comment'>--</span> <a name="line-7"></a><span class='hs-comment'>-- (c) The University of Glasgow, 1997-2006</span> <a name="line-8"></a><span class='hs-comment'>--</span> <a name="line-9"></a><span class='hs-comment'>-- Character encodings</span> <a name="line-10"></a><span class='hs-comment'>--</span> <a name="line-11"></a><span class='hs-comment'>-- -----------------------------------------------------------------------------</span> <a name="line-12"></a> <a name="line-13"></a><span class='hs-keyword'>module</span> <span class='hs-conid'>Encoding</span> <span class='hs-layout'>(</span> <a name="line-14"></a> <span class='hs-comment'>-- * UTF-8</span> <a name="line-15"></a> <span class='hs-varid'>utf8DecodeChar</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <a name="line-16"></a> <span class='hs-varid'>utf8PrevChar</span><span class='hs-layout'>,</span> <a name="line-17"></a> <span class='hs-varid'>utf8CharStart</span><span class='hs-layout'>,</span> <a name="line-18"></a> <span class='hs-varid'>utf8DecodeChar</span><span class='hs-layout'>,</span> <a name="line-19"></a> <span class='hs-varid'>utf8DecodeString</span><span 
class='hs-layout'>,</span> <a name="line-20"></a> <span class='hs-varid'>utf8EncodeChar</span><span class='hs-layout'>,</span> <a name="line-21"></a> <span class='hs-varid'>utf8EncodeString</span><span class='hs-layout'>,</span> <a name="line-22"></a> <span class='hs-varid'>utf8EncodedLength</span><span class='hs-layout'>,</span> <a name="line-23"></a> <span class='hs-varid'>countUTF8Chars</span><span class='hs-layout'>,</span> <a name="line-24"></a> <a name="line-25"></a> <span class='hs-comment'>-- * Z-encoding</span> <a name="line-26"></a> <span class='hs-varid'>zEncodeString</span><span class='hs-layout'>,</span> <a name="line-27"></a> <span class='hs-varid'>zDecodeString</span> <a name="line-28"></a> <span class='hs-layout'>)</span> <span class='hs-keyword'>where</span> <a name="line-29"></a> <a name="line-30"></a><span class='hs-cpp'>#include "HsVersions.h"</span> <a name="line-31"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Foreign</span> <a name="line-32"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Data</span><span class='hs-varop'>.</span><span class='hs-conid'>Char</span> <a name="line-33"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Numeric</span> <a name="line-34"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>GHC</span><span class='hs-varop'>.</span><span class='hs-conid'>Ptr</span> <span class='hs-layout'>(</span> <span class='hs-conid'>Ptr</span><span class='hs-layout'>(</span><span class='hs-keyglyph'>..</span><span class='hs-layout'>)</span> <span class='hs-layout'>)</span> <a name="line-35"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>GHC</span><span class='hs-varop'>.</span><span class='hs-conid'>Base</span> <a name="line-36"></a> <a name="line-37"></a><span class='hs-comment'>-- -----------------------------------------------------------------------------</span> <a name="line-38"></a><span class='hs-comment'>-- UTF-8</span> <a 
name="line-39"></a> <a name="line-40"></a><span class='hs-comment'>-- We can't write the decoder as efficiently as we'd like without</span> <a name="line-41"></a><span class='hs-comment'>-- resorting to unboxed extensions, unfortunately. I tried to write</span> <a name="line-42"></a><span class='hs-comment'>-- an IO version of this function, but GHC can't eliminate boxed</span> <a name="line-43"></a><span class='hs-comment'>-- results from an IO-returning function.</span> <a name="line-44"></a><span class='hs-comment'>--</span> <a name="line-45"></a><span class='hs-comment'>-- We assume we can ignore overflow when parsing a multibyte character here.</span> <a name="line-46"></a><span class='hs-comment'>-- To make this safe, we add extra sentinel bytes to unparsed UTF-8 sequences</span> <a name="line-47"></a><span class='hs-comment'>-- before decoding them (see StringBuffer.hs).</span> <a name="line-48"></a> <a name="line-49"></a><a name="utf8DecodeChar"></a><span class='hs-comment'>{-# INLINE utf8DecodeChar# #-}</span> <a name="line-50"></a><span class='hs-definition'>utf8DecodeChar</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Addr</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>-></span> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-conid'>Char</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <span class='hs-conid'>Addr</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <a name="line-51"></a><span class='hs-definition'>utf8DecodeChar</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>=</span> <a name="line-52"></a> <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch0</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span 
class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>0</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span> <a name="line-53"></a> <span class='hs-keyword'>case</span> <span class='hs-conid'>()</span> <span class='hs-keyword'>of</span> <a name="line-54"></a> <span class='hs-keyword'>_</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&lt;=#</span> <span class='hs-num'>0x7F</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>-></span> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>chr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>ch0</span><span class='hs-layout'>,</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <a name="line-55"></a> <a name="line-56"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>>=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&lt;=#</span> <span class='hs-num'>0xDF</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>-></span> <a name="line-57"></a> <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch1</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span 
class='hs-num'>1</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span> <a name="line-58"></a> <span class='hs-keyword'>if</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>>=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span> <a name="line-59"></a> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>chr</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch0</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>6</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>+#</span> <a name="line-60"></a> <span class='hs-layout'>(</span><span class='hs-varid'>ch1</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span> <a name="line-61"></a> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>2</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <a name="line-62"></a> <a name="line-63"></a> <span 
class='hs-keyglyph'>|</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>>=#</span> <span class='hs-num'>0xE0</span><span class='hs-cpp'>#</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&lt;=#</span> <span class='hs-num'>0xEF</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>-></span> <a name="line-64"></a> <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch1</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span> <a name="line-65"></a> <span class='hs-keyword'>if</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>>=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span> <a name="line-66"></a> <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch2</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>2</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span> <a name="line-67"></a> <span class='hs-keyword'>if</span> <span 
class='hs-varid'>ch2</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch2</span> <span class='hs-varop'>>=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>2</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span> <a name="line-68"></a> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>chr</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch0</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0xE0</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>12</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>+#</span> <a name="line-69"></a> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch1</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>6</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>+#</span> <a name="line-70"></a> <span class='hs-layout'>(</span><span class='hs-varid'>ch2</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span> <a name="line-71"></a> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> 
<span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>3</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <a name="line-72"></a> <a name="line-73"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>>=#</span> <span class='hs-num'>0xF0</span><span class='hs-cpp'>#</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>ch0</span> <span class='hs-varop'>&lt;=#</span> <span class='hs-num'>0xF8</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>-></span> <a name="line-74"></a> <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch1</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span> <a name="line-75"></a> <span class='hs-keyword'>if</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch1</span> <span class='hs-varop'>>=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span> <a name="line-76"></a> <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch2</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span 
class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>2</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span> <a name="line-77"></a> <span class='hs-keyword'>if</span> <span class='hs-varid'>ch2</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch2</span> <span class='hs-varop'>>=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>2</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span> <a name="line-78"></a> <span class='hs-keyword'>let</span> <span class='hs-varop'>!</span><span class='hs-varid'>ch3</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>word2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>indexWord8OffAddr</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-num'>3</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyword'>in</span> <a name="line-79"></a> <span class='hs-keyword'>if</span> <span class='hs-varid'>ch3</span> <span class='hs-varop'>&lt;#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span> <span class='hs-varop'>||</span> <span class='hs-varid'>ch3</span> <span class='hs-varop'>>=#</span> <span class='hs-num'>0xC0</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>fail</span> <span class='hs-num'>3</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>else</span> <a name="line-80"></a> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>chr</span><span class='hs-cpp'>#</span> <span 
class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch0</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0xF0</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>18</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>+#</span> <a name="line-81"></a> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch1</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>12</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>+#</span> <a name="line-82"></a> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>ch2</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>`</span><span class='hs-varid'>uncheckedIShiftL</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>6</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-varop'>+#</span> <a name="line-83"></a> <span class='hs-layout'>(</span><span class='hs-varid'>ch3</span> <span class='hs-varop'>-#</span> <span class='hs-num'>0x80</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span> <a name="line-84"></a> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span 
class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-num'>4</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <a name="line-85"></a> <a name="line-86"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>-></span> <span class='hs-varid'>fail</span> <span class='hs-num'>1</span><span class='hs-cpp'>#</span> <a name="line-87"></a> <span class='hs-keyword'>where</span> <a name="line-88"></a> <span class='hs-comment'>-- all invalid sequences end up here:</span> <a name="line-89"></a> <span class='hs-varid'>fail</span> <span class='hs-varid'>n</span> <span class='hs-keyglyph'>=</span> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-chr'>'\0'</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-varid'>n</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <a name="line-90"></a> <span class='hs-comment'>-- '\xFFFD' would be the usual replacement character, but</span> <a name="line-91"></a> <span class='hs-comment'>-- that's a valid symbol in Haskell, so will result in a</span> <a name="line-92"></a> <span class='hs-comment'>-- confusing parse error later on. 
Instead we use '\0' which</span> <a name="line-93"></a> <span class='hs-comment'>-- will signal a lexer error immediately.</span> <a name="line-94"></a> <a name="line-95"></a><span class='hs-definition'>utf8DecodeChar</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-></span> <span class='hs-layout'>(</span><span class='hs-conid'>Char</span><span class='hs-layout'>,</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span><span class='hs-layout'>)</span> <a name="line-96"></a><span class='hs-definition'>utf8DecodeChar</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <a name="line-97"></a> <span class='hs-keyword'>case</span> <span class='hs-varid'>utf8DecodeChar</span><span class='hs-cpp'>#</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>of</span> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>c</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <span class='hs-varid'>b</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-></span> <span class='hs-layout'>(</span> <span class='hs-conid'>C</span><span class='hs-cpp'>#</span> <span class='hs-varid'>c</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <span class='hs-conid'>Ptr</span> <span class='hs-varid'>b</span><span class='hs-cpp'>#</span> <span class='hs-layout'>)</span> <a name="line-98"></a> <a name="line-99"></a><a name="utf8PrevChar"></a><span class='hs-comment'>-- UTF-8 is cleverly designed so that we can always figure out where</span> <a name="line-100"></a><span class='hs-comment'>-- the start of the current character is, given any position in a</span> <a 
name="line-101"></a><span class='hs-comment'>-- stream. This function finds the start of the previous character,</span> <a name="line-102"></a><span class='hs-comment'>-- assuming there *is* a previous character.</span> <a name="line-103"></a><span class='hs-definition'>utf8PrevChar</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>IO</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span><span class='hs-layout'>)</span> <a name="line-104"></a><span class='hs-definition'>utf8PrevChar</span> <span class='hs-varid'>p</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>utf8CharStart</span> <span class='hs-layout'>(</span><span class='hs-varid'>p</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-layout'>(</span><span class='hs-comment'>-</span><span class='hs-num'>1</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-105"></a> <a name="line-106"></a><a name="utf8CharStart"></a><span class='hs-definition'>utf8CharStart</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>IO</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span><span class='hs-layout'>)</span> <a name="line-107"></a><span class='hs-definition'>utf8CharStart</span> <span class='hs-varid'>p</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-varid'>p</span> <a name="line-108"></a> <span class='hs-keyword'>where</span> <span class='hs-varid'>go</span> <span class='hs-varid'>p</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>do</span> <span class='hs-varid'>w</span> <span class='hs-keyglyph'>&lt;-</span> <span class='hs-varid'>peek</span> <span 
class='hs-varid'>p</span> <a name="line-109"></a> <span class='hs-keyword'>if</span> <span class='hs-varid'>w</span> <span class='hs-varop'>>=</span> <span class='hs-num'>0x80</span> <span class='hs-varop'>&amp;&amp;</span> <span class='hs-varid'>w</span> <span class='hs-varop'>&lt;</span> <span class='hs-num'>0xC0</span> <a name="line-110"></a> <span class='hs-keyword'>then</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>p</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-layout'>(</span><span class='hs-comment'>-</span><span class='hs-num'>1</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-111"></a> <span class='hs-keyword'>else</span> <span class='hs-varid'>return</span> <span class='hs-varid'>p</span> <a name="line-112"></a> <a name="line-113"></a><a name="utf8DecodeString"></a><span class='hs-definition'>utf8DecodeString</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Int</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>IO</span> <span class='hs-keyglyph'>[</span><span class='hs-conid'>Char</span><span class='hs-keyglyph'>]</span> <a name="line-114"></a><span class='hs-conid'>STRICT2</span><span class='hs-layout'>(</span><span class='hs-varid'>utf8DecodeString</span><span class='hs-layout'>)</span> <a name="line-115"></a><span class='hs-definition'>utf8DecodeString</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-varid'>a</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-layout'>(</span><span class='hs-conid'>I</span><span class='hs-cpp'>#</span> <span class='hs-varid'>len</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <a name="line-116"></a> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>unpack</span> <span 
class='hs-varid'>a</span><span class='hs-cpp'>#</span> <a name="line-117"></a> <span class='hs-keyword'>where</span> <a name="line-118"></a> <span class='hs-varop'>!</span><span class='hs-varid'>end</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>addr2Int</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>a</span><span class='hs-cpp'>#</span> <span class='hs-varop'>`</span><span class='hs-varid'>plusAddr</span><span class='hs-cpp'>#</span><span class='hs-varop'>`</span> <span class='hs-varid'>len</span><span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <a name="line-119"></a> <a name="line-120"></a> <span class='hs-varid'>unpack</span> <span class='hs-varid'>p</span><span class='hs-cpp'>#</span> <a name="line-121"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>addr2Int</span><span class='hs-cpp'>#</span> <span class='hs-varid'>p</span><span class='hs-cpp'>#</span> <span class='hs-varop'>>=#</span> <span class='hs-varid'>end</span><span class='hs-cpp'>#</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>return</span> <span class='hs-conid'>[]</span> <a name="line-122"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>=</span> <a name="line-123"></a> <span class='hs-keyword'>case</span> <span class='hs-varid'>utf8DecodeChar</span><span class='hs-cpp'>#</span> <span class='hs-varid'>p</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>of</span> <a name="line-124"></a> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-varid'>c</span><span class='hs-cpp'>#</span><span class='hs-layout'>,</span> <span class='hs-varid'>q</span><span class='hs-cpp'>#</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-></span> <span class='hs-keyword'>do</span> <a name="line-125"></a> <span class='hs-varid'>chs</span> <span 
class='hs-keyglyph'>&lt;-</span> <span class='hs-varid'>unpack</span> <span class='hs-varid'>q</span><span class='hs-cpp'>#</span> <a name="line-126"></a> <span class='hs-varid'>return</span> <span class='hs-layout'>(</span><span class='hs-conid'>C</span><span class='hs-cpp'>#</span> <span class='hs-varid'>c</span><span class='hs-cpp'>#</span> <span class='hs-conop'>:</span> <span class='hs-varid'>chs</span><span class='hs-layout'>)</span> <a name="line-127"></a> <a name="line-128"></a><a name="countUTF8Chars"></a><span class='hs-definition'>countUTF8Chars</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Int</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>IO</span> <span class='hs-conid'>Int</span> <a name="line-129"></a><span class='hs-definition'>countUTF8Chars</span> <span class='hs-varid'>ptr</span> <span class='hs-varid'>bytes</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>0</span> <a name="line-130"></a> <span class='hs-keyword'>where</span> <a name="line-131"></a> <span class='hs-varid'>end</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>ptr</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-varid'>bytes</span> <a name="line-132"></a> <a name="line-133"></a> <span class='hs-conid'>STRICT2</span><span class='hs-layout'>(</span><span class='hs-varid'>go</span><span class='hs-layout'>)</span> <a name="line-134"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>ptr</span> <span class='hs-varid'>n</span> <a name="line-135"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ptr</span> <span class='hs-varop'>>=</span> <span class='hs-varid'>end</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>return</span> <span class='hs-varid'>n</span> <a name="line-136"></a> <span 
class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>do</span> <a name="line-137"></a> <span class='hs-keyword'>case</span> <span class='hs-varid'>utf8DecodeChar</span><span class='hs-cpp'>#</span> <span class='hs-layout'>(</span><span class='hs-varid'>unPtr</span> <span class='hs-varid'>ptr</span><span class='hs-layout'>)</span> <span class='hs-keyword'>of</span> <a name="line-138"></a> <span class='hs-layout'>(</span><span class='hs-cpp'>#</span> <span class='hs-keyword'>_</span><span class='hs-layout'>,</span> <span class='hs-varid'>a</span> <span class='hs-cpp'>#</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-></span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-varid'>a</span><span class='hs-layout'>)</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <a name="line-139"></a> <a name="line-140"></a><a name="unPtr"></a><span class='hs-definition'>unPtr</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-varid'>a</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Addr</span><span class='hs-cpp'>#</span> <a name="line-141"></a><span class='hs-definition'>unPtr</span> <span class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-varid'>a</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>a</span> <a name="line-142"></a> <a name="line-143"></a><a name="utf8EncodeChar"></a><span class='hs-definition'>utf8EncodeChar</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>IO</span> <span 
class='hs-layout'>(</span><span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span><span class='hs-layout'>)</span> <a name="line-144"></a><span class='hs-definition'>utf8EncodeChar</span> <span class='hs-varid'>c</span> <span class='hs-varid'>ptr</span> <span class='hs-keyglyph'>=</span> <a name="line-145"></a> <span class='hs-keyword'>let</span> <span class='hs-varid'>x</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>ord</span> <span class='hs-varid'>c</span> <span class='hs-keyword'>in</span> <a name="line-146"></a> <span class='hs-keyword'>case</span> <span class='hs-conid'>()</span> <span class='hs-keyword'>of</span> <a name="line-147"></a> <span class='hs-keyword'>_</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>x</span> <span class='hs-varop'>></span> <span class='hs-num'>0</span> <span class='hs-varop'>&&</span> <span class='hs-varid'>x</span> <span class='hs-varop'><=</span> <span class='hs-num'>0x007f</span> <span class='hs-keyglyph'>-></span> <span class='hs-keyword'>do</span> <a name="line-148"></a> <span class='hs-varid'>poke</span> <span class='hs-varid'>ptr</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-varid'>x</span><span class='hs-layout'>)</span> <a name="line-149"></a> <span class='hs-varid'>return</span> <span class='hs-layout'>(</span><span class='hs-varid'>ptr</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-num'>1</span><span class='hs-layout'>)</span> <a name="line-150"></a> <span class='hs-comment'>-- NB. '\0' is encoded as '\xC0\x80', not '\0'. 
This is so that we</span> <a name="line-151"></a> <span class='hs-comment'>-- can have 0-terminated UTF-8 strings (see GHC.Base.unpackCStringUtf8).</span> <a name="line-152"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>x</span> <span class='hs-varop'><=</span> <span class='hs-num'>0x07ff</span> <span class='hs-keyglyph'>-></span> <span class='hs-keyword'>do</span> <a name="line-153"></a> <span class='hs-varid'>poke</span> <span class='hs-varid'>ptr</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0xC0</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>6</span><span class='hs-layout'>)</span> <span class='hs-varop'>.&.</span> <span class='hs-num'>0x1F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-154"></a> <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>1</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>.&.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-155"></a> <span class='hs-varid'>return</span> <span class='hs-layout'>(</span><span class='hs-varid'>ptr</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-num'>2</span><span class='hs-layout'>)</span> <a name="line-156"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>x</span> <span class='hs-varop'><=</span> <span class='hs-num'>0xffff</span> <span class='hs-keyglyph'>-></span> <span 
class='hs-keyword'>do</span> <a name="line-157"></a> <span class='hs-varid'>poke</span> <span class='hs-varid'>ptr</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0xE0</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>12</span><span class='hs-layout'>)</span> <span class='hs-varop'>.&.</span> <span class='hs-num'>0x0F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-158"></a> <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>1</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>6</span><span class='hs-layout'>)</span> <span class='hs-varop'>.&.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-159"></a> <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>2</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>.&.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-160"></a> <span class='hs-varid'>return</span> <span class='hs-layout'>(</span><span class='hs-varid'>ptr</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-num'>3</span><span class='hs-layout'>)</span> <a name="line-161"></a> <span 
class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>-></span> <span class='hs-keyword'>do</span> <a name="line-162"></a> <span class='hs-varid'>poke</span> <span class='hs-varid'>ptr</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0xF0</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>18</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-163"></a> <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>1</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>12</span><span class='hs-layout'>)</span> <span class='hs-varop'>.&.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-164"></a> <span class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>2</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>`shiftR`</span> <span class='hs-num'>6</span><span class='hs-layout'>)</span> <span class='hs-varop'>.&.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-165"></a> <span 
class='hs-varid'>pokeElemOff</span> <span class='hs-varid'>ptr</span> <span class='hs-num'>3</span> <span class='hs-layout'>(</span><span class='hs-varid'>fromIntegral</span> <span class='hs-layout'>(</span><span class='hs-num'>0x80</span> <span class='hs-varop'>.|.</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span> <span class='hs-varop'>.&.</span> <span class='hs-num'>0x3F</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-166"></a> <span class='hs-varid'>return</span> <span class='hs-layout'>(</span><span class='hs-varid'>ptr</span> <span class='hs-varop'>`plusPtr`</span> <span class='hs-num'>4</span><span class='hs-layout'>)</span> <a name="line-167"></a> <a name="line-168"></a><a name="utf8EncodeString"></a><span class='hs-definition'>utf8EncodeString</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Ptr</span> <span class='hs-conid'>Word8</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>String</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>IO</span> <span class='hs-conid'>()</span> <a name="line-169"></a><span class='hs-definition'>utf8EncodeString</span> <span class='hs-varid'>ptr</span> <span class='hs-varid'>str</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-varid'>ptr</span> <span class='hs-varid'>str</span> <a name="line-170"></a> <span class='hs-keyword'>where</span> <span class='hs-conid'>STRICT2</span><span class='hs-layout'>(</span><span class='hs-varid'>go</span><span class='hs-layout'>)</span> <a name="line-171"></a> <span class='hs-varid'>go</span> <span class='hs-keyword'>_</span> <span class='hs-conid'>[]</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>return</span> <span class='hs-conid'>()</span> <a name="line-172"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>ptr</span> <span class='hs-layout'>(</span><span 
class='hs-varid'>c</span><span class='hs-conop'>:</span><span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>do</span> <a name="line-173"></a> <span class='hs-varid'>ptr'</span> <span class='hs-keyglyph'><-</span> <span class='hs-varid'>utf8EncodeChar</span> <span class='hs-varid'>c</span> <span class='hs-varid'>ptr</span> <a name="line-174"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>ptr'</span> <span class='hs-varid'>cs</span> <a name="line-175"></a> <a name="line-176"></a><a name="utf8EncodedLength"></a><span class='hs-definition'>utf8EncodedLength</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>String</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Int</span> <a name="line-177"></a><span class='hs-definition'>utf8EncodedLength</span> <span class='hs-varid'>str</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-num'>0</span> <span class='hs-varid'>str</span> <a name="line-178"></a> <span class='hs-keyword'>where</span> <span class='hs-conid'>STRICT2</span><span class='hs-layout'>(</span><span class='hs-varid'>go</span><span class='hs-layout'>)</span> <a name="line-179"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-conid'>[]</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>n</span> <a name="line-180"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span><span class='hs-conop'>:</span><span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <a name="line-181"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ord</span> <span class='hs-varid'>c</span> <span class='hs-varop'>></span> <span class='hs-num'>0</span> <span class='hs-varop'>&&</span> <span class='hs-varid'>ord</span> <span class='hs-varid'>c</span> <span class='hs-varop'><=</span> <span 
class='hs-num'>0x007f</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span> <a name="line-182"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ord</span> <span class='hs-varid'>c</span> <span class='hs-varop'><=</span> <span class='hs-num'>0x07ff</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>2</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span> <a name="line-183"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>ord</span> <span class='hs-varid'>c</span> <span class='hs-varop'><=</span> <span class='hs-num'>0xffff</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>3</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span> <a name="line-184"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>4</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span> <a name="line-185"></a> <a name="line-186"></a><span class='hs-comment'>-- -----------------------------------------------------------------------------</span> <a name="line-187"></a><span class='hs-comment'>-- The Z-encoding</span> <a name="line-188"></a> <a name="line-189"></a><span class='hs-comment'>{- <a name="line-190"></a>This is the main name-encoding and decoding function. 
It encodes any <a name="line-191"></a>string into a string that is acceptable as a C name. This is done <a name="line-192"></a>right before we emit a symbol name into the compiled C or asm code. <a name="line-193"></a>Z-encoding of strings is cached in the FastString interface, so we <a name="line-194"></a>never encode the same string more than once. <a name="line-195"></a> <a name="line-196"></a>The basic encoding scheme is this. <a name="line-197"></a> <a name="line-198"></a>* Tuples (,,) are coded as Z3T <a name="line-199"></a> <a name="line-200"></a>* Alphabetic characters (upper and lower) and digits <a name="line-201"></a> all translate to themselves; <a name="line-202"></a> except 'Z', which translates to 'ZZ' <a name="line-203"></a> and 'z', which translates to 'zz' <a name="line-204"></a> We need both so that we can preserve the variable/tycon distinction <a name="line-205"></a> <a name="line-206"></a>* Most other printable characters translate to 'zx' or 'Zx' for some <a name="line-207"></a> alphabetic character x <a name="line-208"></a> <a name="line-209"></a>* The others translate as 'znnnU' where 'nnn' is the hexadecimal code <a name="line-210"></a> of the character (with a leading '0' if it would start with a letter) <a name="line-211"></a> <a name="line-212"></a> Before After <a name="line-213"></a> -------------------------- <a name="line-214"></a> Trak Trak <a name="line-215"></a> foo_wib foozuwib <a name="line-216"></a> > zg <a name="line-217"></a> >1 zg1 <a name="line-218"></a> foo# foozh <a name="line-219"></a> foo## foozhzh <a name="line-220"></a> foo##1 foozhzh1 <a name="line-221"></a> fooZ fooZZ <a name="line-222"></a> :+ ZCzp <a name="line-223"></a> () Z0T 0-tuple <a name="line-224"></a> (,,,,) Z5T 5-tuple <a name="line-225"></a> (# #) Z1H unboxed 1-tuple (note the space) <a name="line-226"></a> (#,,,,#) Z5H unboxed 5-tuple <a name="line-227"></a> (NB: There is no Z1T nor Z0H.) 
<a name="line-228"></a>-}</span> <a name="line-229"></a> <a name="line-230"></a><a name="UserString"></a><span class='hs-keyword'>type</span> <span class='hs-conid'>UserString</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>String</span> <span class='hs-comment'>-- As the user typed it</span> <a name="line-231"></a><a name="EncodedString"></a><span class='hs-keyword'>type</span> <span class='hs-conid'>EncodedString</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>String</span> <span class='hs-comment'>-- Encoded form</span> <a name="line-232"></a> <a name="line-233"></a> <a name="line-234"></a><a name="zEncodeString"></a><span class='hs-definition'>zEncodeString</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>UserString</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>EncodedString</span> <a name="line-235"></a><span class='hs-definition'>zEncodeString</span> <span class='hs-varid'>cs</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>case</span> <span class='hs-varid'>maybe_tuple</span> <span class='hs-varid'>cs</span> <span class='hs-keyword'>of</span> <a name="line-236"></a> <span class='hs-conid'>Just</span> <span class='hs-varid'>n</span> <span class='hs-keyglyph'>-></span> <span class='hs-varid'>n</span> <span class='hs-comment'>-- Tuples go to Z2T etc</span> <a name="line-237"></a> <span class='hs-conid'>Nothing</span> <span class='hs-keyglyph'>-></span> <span class='hs-varid'>go</span> <span class='hs-varid'>cs</span> <a name="line-238"></a> <span class='hs-keyword'>where</span> <a name="line-239"></a> <span class='hs-varid'>go</span> <span class='hs-conid'>[]</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>[]</span> <a name="line-240"></a> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span><span class='hs-conop'>:</span><span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span 
class='hs-keyglyph'>=</span> <span class='hs-varid'>encode_digit_ch</span> <span class='hs-varid'>c</span> <span class='hs-varop'>++</span> <span class='hs-varid'>go'</span> <span class='hs-varid'>cs</span> <a name="line-241"></a> <span class='hs-varid'>go'</span> <span class='hs-conid'>[]</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>[]</span> <a name="line-242"></a> <span class='hs-varid'>go'</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span><span class='hs-conop'>:</span><span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>encode_ch</span> <span class='hs-varid'>c</span> <span class='hs-varop'>++</span> <span class='hs-varid'>go'</span> <span class='hs-varid'>cs</span> <a name="line-243"></a> <a name="line-244"></a><a name="unencodedChar"></a><span class='hs-definition'>unencodedChar</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Bool</span> <span class='hs-comment'>-- True for chars that don't need encoding</span> <a name="line-245"></a><span class='hs-definition'>unencodedChar</span> <span class='hs-chr'>'Z'</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>False</span> <a name="line-246"></a><span class='hs-definition'>unencodedChar</span> <span class='hs-chr'>'z'</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>False</span> <a name="line-247"></a><span class='hs-definition'>unencodedChar</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>c</span> <span class='hs-varop'>>=</span> <span class='hs-chr'>'a'</span> <span class='hs-varop'>&&</span> <span class='hs-varid'>c</span> <span class='hs-varop'><=</span> <span class='hs-chr'>'z'</span> <a name="line-248"></a> <span class='hs-varop'>||</span> <span class='hs-varid'>c</span> <span class='hs-varop'>>=</span> <span 
class='hs-chr'>'A'</span> <span class='hs-varop'>&&</span> <span class='hs-varid'>c</span> <span class='hs-varop'><=</span> <span class='hs-chr'>'Z'</span> <a name="line-249"></a> <span class='hs-varop'>||</span> <span class='hs-varid'>c</span> <span class='hs-varop'>>=</span> <span class='hs-chr'>'0'</span> <span class='hs-varop'>&&</span> <span class='hs-varid'>c</span> <span class='hs-varop'><=</span> <span class='hs-chr'>'9'</span> <a name="line-250"></a> <a name="line-251"></a><a name="encode_digit_ch"></a><span class='hs-comment'>-- If a digit is at the start of a symbol then we need to encode it.</span> <a name="line-252"></a><span class='hs-comment'>-- Otherwise package names like 9pH-0.1 give linker errors.</span> <a name="line-253"></a><span class='hs-definition'>encode_digit_ch</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>EncodedString</span> <a name="line-254"></a><span class='hs-definition'>encode_digit_ch</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>c</span> <span class='hs-varop'>>=</span> <span class='hs-chr'>'0'</span> <span class='hs-varop'>&&</span> <span class='hs-varid'>c</span> <span class='hs-varop'><=</span> <span class='hs-chr'>'9'</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>encode_as_unicode_char</span> <span class='hs-varid'>c</span> <a name="line-255"></a><span class='hs-definition'>encode_digit_ch</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>encode_ch</span> <span class='hs-varid'>c</span> <a name="line-256"></a> <a name="line-257"></a><a name="encode_ch"></a><span class='hs-definition'>encode_ch</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-></span> <span 
class='hs-conid'>EncodedString</span> <a name="line-258"></a><span class='hs-definition'>encode_ch</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>unencodedChar</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyglyph'>[</span><span class='hs-varid'>c</span><span class='hs-keyglyph'>]</span> <span class='hs-comment'>-- Common case first</span> <a name="line-259"></a> <a name="line-260"></a><span class='hs-comment'>-- Constructors</span> <a name="line-261"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'('</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZL"</span> <span class='hs-comment'>-- Needed for things like (,), and (->)</span> <a name="line-262"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>')'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZR"</span> <span class='hs-comment'>-- For symmetry with (</span> <a name="line-263"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'['</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZM"</span> <a name="line-264"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>']'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZN"</span> <a name="line-265"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>':'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZC"</span> <a name="line-266"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'Z'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ZZ"</span> <a name="line-267"></a> <a name="line-268"></a><span class='hs-comment'>-- Variables</span> <a name="line-269"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'z'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zz"</span> <a name="line-270"></a><span class='hs-definition'>encode_ch</span> 
<span class='hs-chr'>'&'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"za"</span> <a name="line-271"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'|'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zb"</span> <a name="line-272"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'^'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zc"</span> <a name="line-273"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'$'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zd"</span> <a name="line-274"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'='</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"ze"</span> <a name="line-275"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'>'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zg"</span> <a name="line-276"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'#'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zh"</span> <a name="line-277"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'.'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zi"</span> <a name="line-278"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'<'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zl"</span> <a name="line-279"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'-'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zm"</span> <a name="line-280"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'!'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zn"</span> <a name="line-281"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'+'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zp"</span> <a name="line-282"></a><span 
class='hs-definition'>encode_ch</span> <span class='hs-chr'>'\''</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zq"</span> <a name="line-283"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'\\'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zr"</span> <a name="line-284"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'/'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zs"</span> <a name="line-285"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'*'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zt"</span> <a name="line-286"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'_'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zu"</span> <a name="line-287"></a><span class='hs-definition'>encode_ch</span> <span class='hs-chr'>'%'</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"zv"</span> <a name="line-288"></a><span class='hs-definition'>encode_ch</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>encode_as_unicode_char</span> <span class='hs-varid'>c</span> <a name="line-289"></a> <a name="line-290"></a><a name="encode_as_unicode_char"></a><span class='hs-definition'>encode_as_unicode_char</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>EncodedString</span> <a name="line-291"></a><span class='hs-definition'>encode_as_unicode_char</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'z'</span> <span class='hs-conop'>:</span> <span class='hs-keyword'>if</span> <span class='hs-varid'>isDigit</span> <span class='hs-layout'>(</span><span class='hs-varid'>head</span> <span class='hs-varid'>hex_str</span><span class='hs-layout'>)</span> <span class='hs-keyword'>then</span> <span class='hs-varid'>hex_str</span> <a 
name="line-292"></a> <span class='hs-keyword'>else</span> <span class='hs-chr'>'0'</span><span class='hs-conop'>:</span><span class='hs-varid'>hex_str</span> <a name="line-293"></a> <span class='hs-keyword'>where</span> <span class='hs-varid'>hex_str</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>showHex</span> <span class='hs-layout'>(</span><span class='hs-varid'>ord</span> <span class='hs-varid'>c</span><span class='hs-layout'>)</span> <span class='hs-str'>"U"</span> <a name="line-294"></a> <span class='hs-comment'>-- ToDo: we could improve the encoding here in various ways.</span> <a name="line-295"></a> <span class='hs-comment'>-- eg. strings of unicode characters come out as 'z1234Uz5678U', we</span> <a name="line-296"></a> <span class='hs-comment'>-- could remove the 'U' in the middle (the 'z' works as a separator).</span> <a name="line-297"></a> <a name="line-298"></a><a name="zDecodeString"></a><span class='hs-definition'>zDecodeString</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>EncodedString</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>UserString</span> <a name="line-299"></a><span class='hs-definition'>zDecodeString</span> <span class='hs-conid'>[]</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>[]</span> <a name="line-300"></a><span class='hs-definition'>zDecodeString</span> <span class='hs-layout'>(</span><span class='hs-chr'>'Z'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>d</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <a name="line-301"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>isDigit</span> <span class='hs-varid'>d</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>decode_tuple</span> <span class='hs-varid'>d</span> <span class='hs-varid'>rest</span> <a name="line-302"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span 
class='hs-keyglyph'>=</span> <span class='hs-varid'>decode_upper</span> <span class='hs-varid'>d</span> <span class='hs-conop'>:</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span> <a name="line-303"></a><span class='hs-definition'>zDecodeString</span> <span class='hs-layout'>(</span><span class='hs-chr'>'z'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>d</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <a name="line-304"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>isDigit</span> <span class='hs-varid'>d</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>decode_num_esc</span> <span class='hs-varid'>d</span> <span class='hs-varid'>rest</span> <a name="line-305"></a> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>otherwise</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>decode_lower</span> <span class='hs-varid'>d</span> <span class='hs-conop'>:</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span> <a name="line-306"></a><span class='hs-definition'>zDecodeString</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>c</span> <span class='hs-conop'>:</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span> <a name="line-307"></a> <a name="line-308"></a><a name="decode_upper"></a><span class='hs-definition'>decode_upper</span><span class='hs-layout'>,</span> <span class='hs-varid'>decode_lower</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Char</span> <a name="line-309"></a> <a name="line-310"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'L'</span> <span 
class='hs-keyglyph'>=</span> <span class='hs-chr'>'('</span> <a name="line-311"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'R'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>')'</span> <a name="line-312"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'M'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'['</span> <a name="line-313"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'N'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>']'</span> <a name="line-314"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'C'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>':'</span> <a name="line-315"></a><span class='hs-definition'>decode_upper</span> <span class='hs-chr'>'Z'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'Z'</span> <a name="line-316"></a><span class='hs-definition'>decode_upper</span> <span class='hs-varid'>ch</span> <span class='hs-keyglyph'>=</span> <span class='hs-comment'>{-pprTrace "decode_upper" (char ch)-}</span> <span class='hs-varid'>ch</span> <a name="line-317"></a> <a name="line-318"></a><a name="decode_lower"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'z'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'z'</span> <a name="line-319"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'a'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'&'</span> <a name="line-320"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'b'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'|'</span> <a name="line-321"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'c'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'^'</span> <a name="line-322"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'d'</span> <span 
class='hs-keyglyph'>=</span> <span class='hs-chr'>'$'</span> <a name="line-323"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'e'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'='</span> <a name="line-324"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'g'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'&gt;'</span> <a name="line-325"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'h'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'#'</span> <a name="line-326"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'i'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'.'</span> <a name="line-327"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'l'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'&lt;'</span> <a name="line-328"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'m'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'-'</span> <a name="line-329"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'n'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'!'</span> <a name="line-330"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'p'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'+'</span> <a name="line-331"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'q'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'\''</span> <a name="line-332"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'r'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'\\'</span> <a name="line-333"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'s'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'/'</span> <a name="line-334"></a><span
class='hs-definition'>decode_lower</span> <span class='hs-chr'>'t'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'*'</span> <a name="line-335"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'u'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'_'</span> <a name="line-336"></a><span class='hs-definition'>decode_lower</span> <span class='hs-chr'>'v'</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'%'</span> <a name="line-337"></a><span class='hs-definition'>decode_lower</span> <span class='hs-varid'>ch</span> <span class='hs-keyglyph'>=</span> <span class='hs-comment'>{-pprTrace "decode_lower" (char ch)-}</span> <span class='hs-varid'>ch</span> <a name="line-338"></a> <a name="line-339"></a><a name="decode_num_esc"></a><span class='hs-comment'>-- Characters not having a specific code are coded as z224U (in hex)</span> <a name="line-340"></a><span class='hs-definition'>decode_num_esc</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>EncodedString</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>UserString</span> <a name="line-341"></a><span class='hs-definition'>decode_num_esc</span> <span class='hs-varid'>d</span> <span class='hs-varid'>rest</span> <a name="line-342"></a> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>digitToInt</span> <span class='hs-varid'>d</span><span class='hs-layout'>)</span> <span class='hs-varid'>rest</span> <a name="line-343"></a> <span class='hs-keyword'>where</span> <a name="line-344"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>isHexDigit</span> 
<span class='hs-varid'>c</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-num'>16</span><span class='hs-varop'>*</span><span class='hs-varid'>n</span> <span class='hs-varop'>+</span> <span class='hs-varid'>digitToInt</span> <span class='hs-varid'>c</span><span class='hs-layout'>)</span> <span class='hs-varid'>rest</span> <a name="line-345"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-chr'>'U'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>chr</span> <span class='hs-varid'>n</span> <span class='hs-conop'>:</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span> <a name="line-346"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-varid'>other</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>error</span> <span class='hs-layout'>(</span><span class='hs-str'>"decode_num_esc: "</span> <span class='hs-varop'>++</span> <span class='hs-varid'>show</span> <span class='hs-varid'>n</span> <span class='hs-varop'>++</span> <span class='hs-chr'>' '</span><span class='hs-conop'>:</span><span class='hs-varid'>other</span><span class='hs-layout'>)</span> <a name="line-347"></a> <a name="line-348"></a><a name="decode_tuple"></a><span class='hs-definition'>decode_tuple</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Char</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>EncodedString</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>UserString</span> <a name="line-349"></a><span class='hs-definition'>decode_tuple</span> <span class='hs-varid'>d</span> <span class='hs-varid'>rest</span> <a name="line-350"></a> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span 
class='hs-layout'>(</span><span class='hs-varid'>digitToInt</span> <span class='hs-varid'>d</span><span class='hs-layout'>)</span> <span class='hs-varid'>rest</span> <a name="line-351"></a> <span class='hs-keyword'>where</span> <a name="line-352"></a> <span class='hs-comment'>-- NB. recurse back to zDecodeString after decoding the tuple, because</span> <a name="line-353"></a> <span class='hs-comment'>-- the tuple might be embedded in a longer name.</span> <a name="line-354"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-varid'>c</span> <span class='hs-conop'>:</span> <span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>isDigit</span> <span class='hs-varid'>c</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-num'>10</span><span class='hs-varop'>*</span><span class='hs-varid'>n</span> <span class='hs-varop'>+</span> <span class='hs-varid'>digitToInt</span> <span class='hs-varid'>c</span><span class='hs-layout'>)</span> <span class='hs-varid'>rest</span> <a name="line-355"></a> <span class='hs-varid'>go</span> <span class='hs-num'>0</span> <span class='hs-layout'>(</span><span class='hs-chr'>'T'</span><span class='hs-conop'>:</span><span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"()"</span> <span class='hs-varop'>++</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span> <a name="line-356"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-chr'>'T'</span><span class='hs-conop'>:</span><span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'('</span> <span class='hs-conop'>:</span> <span class='hs-varid'>replicate</span> 
<span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>-</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-chr'>','</span> <span class='hs-varop'>++</span> <span class='hs-str'>")"</span> <span class='hs-varop'>++</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span> <a name="line-357"></a> <span class='hs-varid'>go</span> <span class='hs-num'>1</span> <span class='hs-layout'>(</span><span class='hs-chr'>'H'</span><span class='hs-conop'>:</span><span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-str'>"(# #)"</span> <span class='hs-varop'>++</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span> <a name="line-358"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-chr'>'H'</span><span class='hs-conop'>:</span><span class='hs-varid'>rest</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-chr'>'('</span> <span class='hs-conop'>:</span> <span class='hs-chr'>'#'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>replicate</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>-</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-chr'>','</span> <span class='hs-varop'>++</span> <span class='hs-str'>"#)"</span> <span class='hs-varop'>++</span> <span class='hs-varid'>zDecodeString</span> <span class='hs-varid'>rest</span> <a name="line-359"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>n</span> <span class='hs-varid'>other</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>error</span> <span class='hs-layout'>(</span><span class='hs-str'>"decode_tuple: "</span> <span class='hs-varop'>++</span> <span class='hs-varid'>show</span> <span class='hs-varid'>n</span> <span
class='hs-varop'>++</span> <span class='hs-chr'>' '</span><span class='hs-conop'>:</span><span class='hs-varid'>other</span><span class='hs-layout'>)</span> <a name="line-360"></a> <a name="line-361"></a><span class='hs-comment'>{- <a name="line-362"></a>Tuples are encoded as <a name="line-363"></a> Z3T or Z3H <a name="line-364"></a>for 3-tuples or unboxed 3-tuples respectively. No other encoding starts <a name="line-365"></a> Z&lt;digit&gt; <a name="line-366"></a> <a name="line-367"></a>* "(# #)" is the tycon for an unboxed 1-tuple (not 0-tuple) <a name="line-368"></a> There are no unboxed 0-tuples. <a name="line-369"></a> <a name="line-370"></a>* "()" is the tycon for a boxed 0-tuple. <a name="line-371"></a> There are no boxed 1-tuples. <a name="line-372"></a>-}</span> <a name="line-373"></a> <a name="line-374"></a><a name="maybe_tuple"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>UserString</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Maybe</span> <span class='hs-conid'>EncodedString</span> <a name="line-375"></a> <a name="line-376"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-str'>"(# #)"</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>Just</span><span class='hs-layout'>(</span><span class='hs-str'>"Z1H"</span><span class='hs-layout'>)</span> <a name="line-377"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-layout'>(</span><span class='hs-chr'>'('</span> <span class='hs-conop'>:</span> <span class='hs-chr'>'#'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>case</span> <span class='hs-varid'>count_commas</span> <span class='hs-layout'>(</span><span class='hs-num'>0</span><span class='hs-keyglyph'>::</span><span class='hs-conid'>Int</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span> <span
class='hs-keyword'>of</span> <a name="line-378"></a> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-layout'>,</span> <span class='hs-chr'>'#'</span> <span class='hs-conop'>:</span> <span class='hs-chr'>')'</span> <span class='hs-conop'>:</span> <span class='hs-keyword'>_</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Just</span> <span class='hs-layout'>(</span><span class='hs-chr'>'Z'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>shows</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-str'>"H"</span><span class='hs-layout'>)</span> <a name="line-379"></a> <span class='hs-keyword'>_</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Nothing</span> <a name="line-380"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-str'>"()"</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>Just</span><span class='hs-layout'>(</span><span class='hs-str'>"Z0T"</span><span class='hs-layout'>)</span> <a name="line-381"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-layout'>(</span><span class='hs-chr'>'('</span> <span class='hs-conop'>:</span> <span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>case</span> <span class='hs-varid'>count_commas</span> <span class='hs-layout'>(</span><span class='hs-num'>0</span><span class='hs-keyglyph'>::</span><span class='hs-conid'>Int</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span> <span class='hs-keyword'>of</span> <a name="line-382"></a> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-layout'>,</span> <span class='hs-chr'>')'</span> <span class='hs-conop'>:</span> <span class='hs-keyword'>_</span><span class='hs-layout'>)</span> <span 
class='hs-keyglyph'>-></span> <span class='hs-conid'>Just</span> <span class='hs-layout'>(</span><span class='hs-chr'>'Z'</span> <span class='hs-conop'>:</span> <span class='hs-varid'>shows</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-str'>"T"</span><span class='hs-layout'>)</span> <a name="line-383"></a> <span class='hs-keyword'>_</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Nothing</span> <a name="line-384"></a><span class='hs-definition'>maybe_tuple</span> <span class='hs-keyword'>_</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>Nothing</span> <a name="line-385"></a> <a name="line-386"></a><a name="count_commas"></a><span class='hs-definition'>count_commas</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Int</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>String</span> <span class='hs-keyglyph'>-></span> <span class='hs-layout'>(</span><span class='hs-conid'>Int</span><span class='hs-layout'>,</span> <span class='hs-conid'>String</span><span class='hs-layout'>)</span> <a name="line-387"></a><span class='hs-definition'>count_commas</span> <span class='hs-varid'>n</span> <span class='hs-layout'>(</span><span class='hs-chr'>','</span> <span class='hs-conop'>:</span> <span class='hs-varid'>cs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>count_commas</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-varop'>+</span><span class='hs-num'>1</span><span class='hs-layout'>)</span> <span class='hs-varid'>cs</span> <a name="line-388"></a><span class='hs-definition'>count_commas</span> <span class='hs-varid'>n</span> <span class='hs-varid'>cs</span> <span class='hs-keyglyph'>=</span> <span class='hs-layout'>(</span><span class='hs-varid'>n</span><span class='hs-layout'>,</span><span 
class='hs-varid'>cs</span><span class='hs-layout'>)</span> </pre></body> </html>