<?xml version="1.0" encoding="UTF-8"?> <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> <html xmlns="http://www.w3.org/1999/xhtml"> <head> <!-- Generated by HsColour, http://www.cs.york.ac.uk/fp/darcs/hscolour/ --> <title>Text/Regex/TDFA/String.hs</title> <link type='text/css' rel='stylesheet' href='hscolour.css' /> </head> <body> <pre><a name="line-1"></a><span class='hs-comment'>{- | <a name="line-2"></a>This module provides 'RegexMaker' and 'RegexLike' instances for using <a name="line-3"></a>'String' with the TDFA backend. <a name="line-4"></a> <a name="line-5"></a>This exports instances of the high level API and the medium level <a name="line-6"></a>API of 'compile','execute', and 'regexec'. <a name="line-7"></a>-}</span> <a name="line-8"></a><span class='hs-comment'>{- By Chris Kuklewicz, 2009. BSD License, see the LICENSE file. -}</span> <a name="line-9"></a><span class='hs-keyword'>module</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>String</span><span class='hs-layout'>(</span> <a name="line-10"></a> <span class='hs-comment'>-- ** Types</span> <a name="line-11"></a> <span class='hs-conid'>Regex</span> <a name="line-12"></a> <span class='hs-layout'>,</span><span class='hs-conid'>MatchOffset</span> <a name="line-13"></a> <span class='hs-layout'>,</span><span class='hs-conid'>MatchLength</span> <a name="line-14"></a> <span class='hs-layout'>,</span><span class='hs-conid'>CompOption</span> <a name="line-15"></a> <span class='hs-layout'>,</span><span class='hs-conid'>ExecOption</span> <a name="line-16"></a> <span class='hs-comment'>-- ** Medium level API functions</span> <a name="line-17"></a> <span class='hs-layout'>,</span><span class='hs-varid'>compile</span> <a name="line-18"></a> <span class='hs-layout'>,</span><span class='hs-varid'>execute</span> <a 
name="line-19"></a> <span class='hs-layout'>,</span><span class='hs-varid'>regexec</span> <a name="line-20"></a> <span class='hs-layout'>)</span> <span class='hs-keyword'>where</span> <a name="line-21"></a> <a name="line-22"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>Base</span><span class='hs-varop'>.</span><span class='hs-conid'>Impl</span><span class='hs-layout'>(</span><span class='hs-varid'>polymatch</span><span class='hs-layout'>,</span><span class='hs-varid'>polymatchM</span><span class='hs-layout'>)</span> <a name="line-23"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>Base</span><span class='hs-varop'>.</span><span class='hs-conid'>RegexLike</span><span class='hs-layout'>(</span><span class='hs-conid'>RegexMaker</span><span class='hs-layout'>(</span><span class='hs-keyglyph'>..</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-conid'>RegexLike</span><span class='hs-layout'>(</span><span class='hs-keyglyph'>..</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-conid'>RegexContext</span><span class='hs-layout'>(</span><span class='hs-keyglyph'>..</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-conid'>MatchOffset</span><span class='hs-layout'>,</span><span class='hs-conid'>MatchLength</span><span class='hs-layout'>,</span><span class='hs-conid'>MatchArray</span><span class='hs-layout'>)</span> <a name="line-24"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span 
class='hs-conid'>Common</span><span class='hs-layout'>(</span><span class='hs-varid'>common_error</span><span class='hs-layout'>,</span><span class='hs-conid'>Regex</span><span class='hs-layout'>(</span><span class='hs-keyglyph'>..</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-conid'>CompOption</span><span class='hs-layout'>,</span><span class='hs-conid'>ExecOption</span><span class='hs-layout'>(</span><span class='hs-varid'>captureGroups</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-25"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>ReadRegex</span><span class='hs-layout'>(</span><span class='hs-varid'>parseRegex</span><span class='hs-layout'>)</span> <a name="line-26"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-layout'>(</span><span class='hs-varid'>patternToRegex</span><span class='hs-layout'>)</span> <a name="line-27"></a> <a name="line-28"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Data</span><span class='hs-varop'>.</span><span class='hs-conid'>Array</span><span class='hs-varop'>.</span><span class='hs-conid'>IArray</span><span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varop'>!</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-varid'>elems</span><span class='hs-layout'>,</span><span class='hs-varid'>amap</span><span class='hs-layout'>)</span> <a name="line-29"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Data</span><span 
class='hs-varop'>.</span><span class='hs-conid'>Maybe</span><span class='hs-layout'>(</span><span class='hs-varid'>listToMaybe</span><span class='hs-layout'>)</span> <a name="line-30"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>NewDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>Engine</span><span class='hs-layout'>(</span><span class='hs-varid'>execMatch</span><span class='hs-layout'>)</span> <a name="line-31"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>NewDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>Tester</span> <span class='hs-keyword'>as</span> <span class='hs-conid'>Tester</span><span class='hs-layout'>(</span><span class='hs-varid'>matchTest</span><span class='hs-layout'>)</span> <a name="line-32"></a> <a name="line-33"></a><a name="err"></a><span class='hs-definition'>err</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>String</span> <span class='hs-keyglyph'>-></span> <span class='hs-varid'>a</span> <a name="line-34"></a><span class='hs-definition'>err</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>common_error</span> <span class='hs-str'>"Text.Regex.TDFA.String"</span> <a name="line-35"></a> <a name="line-36"></a><a name="unwrap"></a><span class='hs-definition'>unwrap</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Either</span> <span class='hs-conid'>String</span> <span class='hs-varid'>v</span> <span class='hs-keyglyph'>-></span> <span class='hs-varid'>v</span> <a name="line-37"></a><span class='hs-definition'>unwrap</span> <span 
class='hs-varid'>x</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>case</span> <span class='hs-varid'>x</span> <span class='hs-keyword'>of</span> <span class='hs-conid'>Left</span> <span class='hs-varid'>msg</span> <span class='hs-keyglyph'>-></span> <span class='hs-varid'>err</span> <span class='hs-layout'>(</span><span class='hs-str'>"Text.Regex.TDFA.String died: "</span><span class='hs-varop'>++</span><span class='hs-varid'>msg</span><span class='hs-layout'>)</span> <a name="line-38"></a> <span class='hs-conid'>Right</span> <span class='hs-varid'>v</span> <span class='hs-keyglyph'>-></span> <span class='hs-varid'>v</span> <a name="line-39"></a> <a name="line-40"></a><a name="compile"></a><span class='hs-definition'>compile</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>CompOption</span> <span class='hs-comment'>-- ^ Flags (summed together)</span> <a name="line-41"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>ExecOption</span> <span class='hs-comment'>-- ^ Flags (summed together)</span> <a name="line-42"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>String</span> <span class='hs-comment'>-- ^ The regular expression to compile (ASCII only, no null bytes)</span> <a name="line-43"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Either</span> <span class='hs-conid'>String</span> <span class='hs-conid'>Regex</span> <span class='hs-comment'>-- ^ Returns: the compiled regular expression</span> <a name="line-44"></a><span class='hs-definition'>compile</span> <span class='hs-varid'>compOpt</span> <span class='hs-varid'>execOpt</span> <span class='hs-varid'>source</span> <span class='hs-keyglyph'>=</span> <a name="line-45"></a> <span class='hs-keyword'>case</span> <span class='hs-varid'>parseRegex</span> <span class='hs-varid'>source</span> <span class='hs-keyword'>of</span> <a name="line-46"></a> <span class='hs-conid'>Left</span> <span class='hs-varid'>msg</span> <span 
class='hs-keyglyph'>-></span> <span class='hs-conid'>Left</span> <span class='hs-layout'>(</span><span class='hs-str'>"parseRegex for Text.Regex.TDFA.String failed:"</span><span class='hs-varop'>++</span><span class='hs-varid'>show</span> <span class='hs-varid'>msg</span><span class='hs-layout'>)</span> <a name="line-47"></a> <span class='hs-conid'>Right</span> <span class='hs-varid'>pattern</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Right</span> <span class='hs-layout'>(</span><span class='hs-varid'>patternToRegex</span> <span class='hs-varid'>pattern</span> <span class='hs-varid'>compOpt</span> <span class='hs-varid'>execOpt</span><span class='hs-layout'>)</span> <a name="line-48"></a> <a name="line-49"></a><span class='hs-keyword'>instance</span> <span class='hs-conid'>RegexMaker</span> <span class='hs-conid'>Regex</span> <span class='hs-conid'>CompOption</span> <span class='hs-conid'>ExecOption</span> <span class='hs-conid'>String</span> <span class='hs-keyword'>where</span> <a name="line-50"></a> <span class='hs-varid'>makeRegexOpts</span> <span class='hs-varid'>c</span> <span class='hs-varid'>e</span> <span class='hs-varid'>source</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>unwrap</span> <span class='hs-layout'>(</span><span class='hs-varid'>compile</span> <span class='hs-varid'>c</span> <span class='hs-varid'>e</span> <span class='hs-varid'>source</span><span class='hs-layout'>)</span> <a name="line-51"></a> <span class='hs-varid'>makeRegexOptsM</span> <span class='hs-varid'>c</span> <span class='hs-varid'>e</span> <span class='hs-varid'>source</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>either</span> <span class='hs-varid'>fail</span> <span class='hs-varid'>return</span> <span class='hs-varop'>$</span> <span class='hs-varid'>compile</span> <span class='hs-varid'>c</span> <span class='hs-varid'>e</span> <span class='hs-varid'>source</span> <a name="line-52"></a> <a name="line-53"></a><a 
name="execute"></a><span class='hs-definition'>execute</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Regex</span> <span class='hs-comment'>-- ^ Compiled regular expression</span> <a name="line-54"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>String</span> <span class='hs-comment'>-- ^ String to match against</span> <a name="line-55"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Either</span> <span class='hs-conid'>String</span> <span class='hs-layout'>(</span><span class='hs-conid'>Maybe</span> <span class='hs-conid'>MatchArray</span><span class='hs-layout'>)</span> <a name="line-56"></a><span class='hs-definition'>execute</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>Right</span> <span class='hs-layout'>(</span><span class='hs-varid'>matchOnce</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span><span class='hs-layout'>)</span> <a name="line-57"></a> <a name="line-58"></a><a name="regexec"></a><span class='hs-definition'>regexec</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Regex</span> <span class='hs-comment'>-- ^ Compiled regular expression</span> <a name="line-59"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>String</span> <span class='hs-comment'>-- ^ String to match against</span> <a name="line-60"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Either</span> <span class='hs-conid'>String</span> <span class='hs-layout'>(</span><span class='hs-conid'>Maybe</span> <span class='hs-layout'>(</span><span class='hs-conid'>String</span><span class='hs-layout'>,</span> <span class='hs-conid'>String</span><span class='hs-layout'>,</span> <span class='hs-conid'>String</span><span class='hs-layout'>,</span> <span class='hs-keyglyph'>[</span><span class='hs-conid'>String</span><span class='hs-keyglyph'>]</span><span class='hs-layout'>)</span><span 
class='hs-layout'>)</span> <a name="line-61"></a><span class='hs-definition'>regexec</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span> <span class='hs-keyglyph'>=</span> <a name="line-62"></a> <span class='hs-keyword'>case</span> <span class='hs-varid'>matchOnceText</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span> <span class='hs-keyword'>of</span> <a name="line-63"></a> <span class='hs-conid'>Nothing</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Right</span> <span class='hs-conid'>Nothing</span> <a name="line-64"></a> <span class='hs-conid'>Just</span> <span class='hs-layout'>(</span><span class='hs-varid'>pre</span><span class='hs-layout'>,</span><span class='hs-varid'>mt</span><span class='hs-layout'>,</span><span class='hs-varid'>post</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-></span> <a name="line-65"></a> <span class='hs-keyword'>let</span> <span class='hs-varid'>main</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>fst</span> <span class='hs-layout'>(</span><span class='hs-varid'>mt</span><span class='hs-varop'>!</span><span class='hs-num'>0</span><span class='hs-layout'>)</span> <a name="line-66"></a> <span class='hs-varid'>rest</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>map</span> <span class='hs-varid'>fst</span> <span class='hs-layout'>(</span><span class='hs-varid'>tail</span> <span class='hs-layout'>(</span><span class='hs-varid'>elems</span> <span class='hs-varid'>mt</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <span class='hs-comment'>-- will be []</span> <a name="line-67"></a> <span class='hs-keyword'>in</span> <span class='hs-conid'>Right</span> <span class='hs-layout'>(</span><span class='hs-conid'>Just</span> <span class='hs-layout'>(</span><span class='hs-varid'>pre</span><span class='hs-layout'>,</span><span class='hs-varid'>main</span><span class='hs-layout'>,</span><span 
class='hs-varid'>post</span><span class='hs-layout'>,</span><span class='hs-varid'>rest</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-68"></a> <a name="line-69"></a><span class='hs-comment'>-- Minimal definition for now</span> <a name="line-70"></a><span class='hs-keyword'>instance</span> <span class='hs-conid'>RegexLike</span> <span class='hs-conid'>Regex</span> <span class='hs-conid'>String</span> <span class='hs-keyword'>where</span> <a name="line-71"></a> <span class='hs-varid'>matchOnce</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>listToMaybe</span> <span class='hs-layout'>(</span><span class='hs-varid'>matchAll</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span><span class='hs-layout'>)</span> <a name="line-72"></a> <span class='hs-varid'>matchAll</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>execMatch</span> <span class='hs-varid'>r</span> <span class='hs-num'>0</span> <span class='hs-chr'>'\n'</span> <span class='hs-varid'>s</span> <a name="line-73"></a> <span class='hs-varid'>matchCount</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>length</span> <span class='hs-layout'>(</span><span class='hs-varid'>matchAll</span> <span class='hs-varid'>r'</span> <span class='hs-varid'>s</span><span class='hs-layout'>)</span> <a name="line-74"></a> <span class='hs-keyword'>where</span> <span class='hs-varid'>r'</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>r</span> <span class='hs-layout'>{</span> <span class='hs-varid'>regex_execOptions</span> <span class='hs-keyglyph'>=</span> <span class='hs-layout'>(</span><span class='hs-varid'>regex_execOptions</span> <span class='hs-varid'>r</span><span class='hs-layout'>)</span> <span 
class='hs-layout'>{</span><span class='hs-varid'>captureGroups</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>False</span><span class='hs-layout'>}</span> <span class='hs-layout'>}</span> <a name="line-75"></a> <span class='hs-varid'>matchTest</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>Tester</span><span class='hs-varop'>.</span><span class='hs-varid'>matchTest</span> <a name="line-76"></a> <span class='hs-comment'>-- matchOnceText</span> <a name="line-77"></a> <span class='hs-varid'>matchAllText</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span> <span class='hs-keyglyph'>=</span> <a name="line-78"></a> <span class='hs-keyword'>let</span> <span class='hs-varid'>go</span> <span class='hs-varid'>i</span> <span class='hs-keyword'>_</span> <span class='hs-keyword'>_</span> <span class='hs-keyglyph'>|</span> <span class='hs-varid'>i</span> <span class='hs-varop'>`seq`</span> <span class='hs-conid'>False</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>undefined</span> <a name="line-79"></a> <span class='hs-varid'>go</span> <span class='hs-sel'>_i</span> <span class='hs-sel'>_t</span> <span class='hs-conid'>[]</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>[]</span> <a name="line-80"></a> <span class='hs-varid'>go</span> <span class='hs-varid'>i</span> <span class='hs-varid'>t</span> <span class='hs-layout'>(</span><span class='hs-varid'>x</span><span class='hs-conop'>:</span><span class='hs-varid'>xs</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-keyword'>let</span> <span class='hs-layout'>(</span><span class='hs-varid'>off0</span><span class='hs-layout'>,</span><span class='hs-varid'>len0</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>x</span><span class='hs-varop'>!</span><span class='hs-num'>0</span> <a name="line-81"></a> <span class='hs-varid'>trans</span> <span 
class='hs-varid'>pair</span><span class='hs-keyglyph'>@</span><span class='hs-layout'>(</span><span class='hs-varid'>off</span><span class='hs-layout'>,</span><span class='hs-varid'>len</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-layout'>(</span><span class='hs-varid'>take</span> <span class='hs-varid'>len</span> <span class='hs-layout'>(</span><span class='hs-varid'>drop</span> <span class='hs-layout'>(</span><span class='hs-varid'>off</span><span class='hs-varop'>-</span><span class='hs-varid'>i</span><span class='hs-layout'>)</span> <span class='hs-varid'>t</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-varid'>pair</span><span class='hs-layout'>)</span> <a name="line-82"></a> <span class='hs-varid'>t'</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>drop</span> <span class='hs-layout'>(</span><span class='hs-varid'>off0</span><span class='hs-varop'>+</span><span class='hs-varid'>len0</span><span class='hs-varop'>-</span><span class='hs-varid'>i</span><span class='hs-layout'>)</span> <span class='hs-varid'>t</span> <a name="line-83"></a> <span class='hs-keyword'>in</span> <span class='hs-varid'>amap</span> <span class='hs-varid'>trans</span> <span class='hs-varid'>x</span> <span class='hs-conop'>:</span> <span class='hs-varid'>seq</span> <span class='hs-varid'>t'</span> <span class='hs-layout'>(</span><span class='hs-varid'>go</span> <span class='hs-layout'>(</span><span class='hs-varid'>off0</span><span class='hs-varop'>+</span><span class='hs-varid'>len0</span><span class='hs-layout'>)</span> <span class='hs-varid'>t'</span> <span class='hs-varid'>xs</span><span class='hs-layout'>)</span> <a name="line-84"></a> <span class='hs-keyword'>in</span> <span class='hs-varid'>go</span> <span class='hs-num'>0</span> <span class='hs-varid'>s</span> <span class='hs-layout'>(</span><span class='hs-varid'>matchAll</span> <span class='hs-varid'>r</span> <span 
class='hs-varid'>s</span><span class='hs-layout'>)</span> <a name="line-85"></a> <a name="line-86"></a><span class='hs-keyword'>instance</span> <span class='hs-conid'>RegexContext</span> <span class='hs-conid'>Regex</span> <span class='hs-conid'>String</span> <span class='hs-conid'>String</span> <span class='hs-keyword'>where</span> <a name="line-87"></a> <span class='hs-varid'>match</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>polymatch</span> <a name="line-88"></a> <span class='hs-varid'>matchM</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>polymatchM</span> </pre></body> </html>