<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<!-- The xmlns declaration is mandatory for a strictly conforming XHTML 1.0 document;
     xml:lang and lang are given together so both XML and HTML parsers see the language. -->
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
<!-- Generated by HsColour, http://www.cs.york.ac.uk/fp/darcs/hscolour/ -->
<!-- Syntax-highlighted listing of a Haskell source file. Every source line is preceded by an
     empty <a name="line-N"> anchor so that individual lines can be deep-linked; the hs-* classes
     on the <span> elements are styled by hscolour.css. -->
<!-- Repeats the encoding from the XML declaration for parsers that treat this file as text/html. -->
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
<title>Text/Regex/TDFA/ByteString.hs</title>
<link type="text/css" rel="stylesheet" href="hscolour.css" />
</head>
<body>
<pre><a name="line-1"></a><span class='hs-comment'>{-| <a name="line-2"></a>This module provides 'RegexMaker' and 'RegexLike' instances for using <a name="line-3"></a>'ByteString' with the DFA backend ("Text.Regex.Lib.WrapDFAEngine" and <a name="line-4"></a>"Text.Regex.Lazy.DFAEngineFPS"). This module is usually used via <a name="line-5"></a>import "Text.Regex.TDFA". <a name="line-6"></a> <a name="line-7"></a>This exports instances of the high level API and the medium level <a name="line-8"></a>API of 'compile','execute', and 'regexec'. <a name="line-9"></a>-}</span> <a name="line-10"></a><span class='hs-comment'>{- By Chris Kuklewicz, 2009. BSD License, see the LICENSE file. 
-}</span> <a name="line-11"></a><span class='hs-keyword'>module</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span><span class='hs-layout'>(</span> <a name="line-12"></a> <span class='hs-conid'>Regex</span> <a name="line-13"></a> <span class='hs-layout'>,</span><span class='hs-conid'>CompOption</span> <a name="line-14"></a> <span class='hs-layout'>,</span><span class='hs-conid'>ExecOption</span> <a name="line-15"></a> <span class='hs-layout'>,</span><span class='hs-varid'>compile</span> <a name="line-16"></a> <span class='hs-layout'>,</span><span class='hs-varid'>execute</span> <a name="line-17"></a> <span class='hs-layout'>,</span><span class='hs-varid'>regexec</span> <a name="line-18"></a> <span class='hs-layout'>)</span> <span class='hs-keyword'>where</span> <a name="line-19"></a> <a name="line-20"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Data</span><span class='hs-varop'>.</span><span class='hs-conid'>Array</span><span class='hs-layout'>(</span><span class='hs-layout'>(</span><span class='hs-varop'>!</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-varid'>elems</span><span class='hs-layout'>)</span> <a name="line-21"></a><span class='hs-keyword'>import</span> <span class='hs-keyword'>qualified</span> <span class='hs-conid'>Data</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span><span class='hs-varop'>.</span><span class='hs-conid'>Char8</span> <span class='hs-keyword'>as</span> <span class='hs-conid'>B</span><span class='hs-layout'>(</span><span class='hs-conid'>ByteString</span><span class='hs-layout'>,</span><span class='hs-varid'>take</span><span class='hs-layout'>,</span><span class='hs-varid'>drop</span><span class='hs-layout'>,</span><span class='hs-varid'>unpack</span><span 
class='hs-layout'>)</span> <a name="line-22"></a> <a name="line-23"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>Base</span><span class='hs-layout'>(</span><span class='hs-conid'>MatchArray</span><span class='hs-layout'>,</span><span class='hs-conid'>RegexContext</span><span class='hs-layout'>(</span><span class='hs-keyglyph'>..</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-conid'>RegexMaker</span><span class='hs-layout'>(</span><span class='hs-keyglyph'>..</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-conid'>RegexLike</span><span class='hs-layout'>(</span><span class='hs-keyglyph'>..</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-24"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>Base</span><span class='hs-varop'>.</span><span class='hs-conid'>Impl</span><span class='hs-layout'>(</span><span class='hs-varid'>polymatch</span><span class='hs-layout'>,</span><span class='hs-varid'>polymatchM</span><span class='hs-layout'>)</span> <a name="line-25"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>ReadRegex</span><span class='hs-layout'>(</span><span class='hs-varid'>parseRegex</span><span class='hs-layout'>)</span> <a name="line-26"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span 
class='hs-varop'>.</span><span class='hs-conid'>String</span><span class='hs-conid'>()</span> <span class='hs-comment'>-- piggyback on RegexMaker for String</span> <a name="line-27"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-layout'>(</span><span class='hs-varid'>patternToRegex</span><span class='hs-layout'>)</span> <a name="line-28"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>Common</span><span class='hs-layout'>(</span><span class='hs-conid'>Regex</span><span class='hs-layout'>(</span><span class='hs-keyglyph'>..</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-conid'>CompOption</span><span class='hs-layout'>,</span><span class='hs-conid'>ExecOption</span><span class='hs-layout'>(</span><span class='hs-varid'>captureGroups</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-29"></a> <a name="line-30"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Data</span><span class='hs-varop'>.</span><span class='hs-conid'>Maybe</span><span class='hs-layout'>(</span><span class='hs-varid'>listToMaybe</span><span class='hs-layout'>)</span> <a name="line-31"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>NewDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>Engine</span><span class='hs-layout'>(</span><span 
class='hs-varid'>execMatch</span><span class='hs-layout'>)</span> <a name="line-32"></a><span class='hs-keyword'>import</span> <span class='hs-conid'>Text</span><span class='hs-varop'>.</span><span class='hs-conid'>Regex</span><span class='hs-varop'>.</span><span class='hs-conid'>TDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>NewDFA</span><span class='hs-varop'>.</span><span class='hs-conid'>Tester</span> <span class='hs-keyword'>as</span> <span class='hs-conid'>Tester</span><span class='hs-layout'>(</span><span class='hs-varid'>matchTest</span><span class='hs-layout'>)</span> <a name="line-33"></a> <a name="line-34"></a><span class='hs-keyword'>instance</span> <span class='hs-conid'>RegexContext</span> <span class='hs-conid'>Regex</span> <span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span> <span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span> <span class='hs-keyword'>where</span> <a name="line-35"></a> <span class='hs-varid'>match</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>polymatch</span> <a name="line-36"></a> <span class='hs-varid'>matchM</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>polymatchM</span> <a name="line-37"></a> <a name="line-38"></a><span class='hs-keyword'>instance</span> <span class='hs-conid'>RegexMaker</span> <span class='hs-conid'>Regex</span> <span class='hs-conid'>CompOption</span> <span class='hs-conid'>ExecOption</span> <span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span> <span class='hs-keyword'>where</span> <a name="line-39"></a> <span class='hs-varid'>makeRegexOptsM</span> <span class='hs-varid'>c</span> <span class='hs-varid'>e</span> <span class='hs-varid'>source</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>makeRegexOptsM</span> <span class='hs-varid'>c</span> <span class='hs-varid'>e</span> <span 
class='hs-layout'>(</span><span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-varid'>unpack</span> <span class='hs-varid'>source</span><span class='hs-layout'>)</span> <a name="line-40"></a> <a name="line-41"></a><span class='hs-keyword'>instance</span> <span class='hs-conid'>RegexLike</span> <span class='hs-conid'>Regex</span> <span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span> <span class='hs-keyword'>where</span> <a name="line-42"></a> <span class='hs-varid'>matchOnce</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>listToMaybe</span> <span class='hs-layout'>(</span><span class='hs-varid'>matchAll</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span><span class='hs-layout'>)</span> <a name="line-43"></a> <span class='hs-varid'>matchAll</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>execMatch</span> <span class='hs-varid'>r</span> <span class='hs-num'>0</span> <span class='hs-chr'>'\n'</span> <span class='hs-varid'>s</span> <a name="line-44"></a> <span class='hs-varid'>matchCount</span> <span class='hs-varid'>r</span> <span class='hs-varid'>s</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>length</span> <span class='hs-layout'>(</span><span class='hs-varid'>matchAll</span> <span class='hs-varid'>r'</span> <span class='hs-varid'>s</span><span class='hs-layout'>)</span> <a name="line-45"></a> <span class='hs-keyword'>where</span> <span class='hs-varid'>r'</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>r</span> <span class='hs-layout'>{</span> <span class='hs-varid'>regex_execOptions</span> <span class='hs-keyglyph'>=</span> <span class='hs-layout'>(</span><span class='hs-varid'>regex_execOptions</span> <span class='hs-varid'>r</span><span class='hs-layout'>)</span> <span 
class='hs-layout'>{</span><span class='hs-varid'>captureGroups</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>False</span><span class='hs-layout'>}</span> <span class='hs-layout'>}</span> <a name="line-46"></a> <span class='hs-varid'>matchTest</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>Tester</span><span class='hs-varop'>.</span><span class='hs-varid'>matchTest</span> <a name="line-47"></a> <span class='hs-varid'>matchOnceText</span> <span class='hs-varid'>regex</span> <span class='hs-varid'>source</span> <span class='hs-keyglyph'>=</span> <a name="line-48"></a> <span class='hs-varid'>fmap</span> <span class='hs-layout'>(</span><span class='hs-keyglyph'>\</span><span class='hs-varid'>ma</span> <span class='hs-keyglyph'>-></span> <span class='hs-keyword'>let</span> <span class='hs-layout'>(</span><span class='hs-varid'>o</span><span class='hs-layout'>,</span><span class='hs-varid'>l</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>ma</span><span class='hs-varop'>!</span><span class='hs-num'>0</span> <a name="line-49"></a> <span class='hs-keyword'>in</span> <span class='hs-layout'>(</span><span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-varid'>take</span> <span class='hs-varid'>o</span> <span class='hs-varid'>source</span> <a name="line-50"></a> <span class='hs-layout'>,</span><span class='hs-varid'>fmap</span> <span class='hs-layout'>(</span><span class='hs-keyglyph'>\</span><span class='hs-varid'>ol</span><span class='hs-keyglyph'>@</span><span class='hs-layout'>(</span><span class='hs-varid'>off</span><span class='hs-layout'>,</span><span class='hs-varid'>len</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-></span> <span class='hs-layout'>(</span><span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-varid'>take</span> <span class='hs-varid'>len</span> <span class='hs-layout'>(</span><span 
class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-varid'>drop</span> <span class='hs-varid'>off</span> <span class='hs-varid'>source</span><span class='hs-layout'>)</span><span class='hs-layout'>,</span><span class='hs-varid'>ol</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <span class='hs-varid'>ma</span> <a name="line-51"></a> <span class='hs-layout'>,</span><span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-varid'>drop</span> <span class='hs-layout'>(</span><span class='hs-varid'>o</span><span class='hs-varop'>+</span><span class='hs-varid'>l</span><span class='hs-layout'>)</span> <span class='hs-varid'>source</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-52"></a> <span class='hs-layout'>(</span><span class='hs-varid'>matchOnce</span> <span class='hs-varid'>regex</span> <span class='hs-varid'>source</span><span class='hs-layout'>)</span> <a name="line-53"></a> <span class='hs-varid'>matchAllText</span> <span class='hs-varid'>regex</span> <span class='hs-varid'>source</span> <span class='hs-keyglyph'>=</span> <a name="line-54"></a> <span class='hs-varid'>map</span> <span class='hs-layout'>(</span><span class='hs-varid'>fmap</span> <span class='hs-layout'>(</span><span class='hs-keyglyph'>\</span><span class='hs-varid'>ol</span><span class='hs-keyglyph'>@</span><span class='hs-layout'>(</span><span class='hs-varid'>off</span><span class='hs-layout'>,</span><span class='hs-varid'>len</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-></span> <span class='hs-layout'>(</span><span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-varid'>take</span> <span class='hs-varid'>len</span> <span class='hs-layout'>(</span><span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-varid'>drop</span> <span class='hs-varid'>off</span> <span class='hs-varid'>source</span><span class='hs-layout'>)</span><span 
class='hs-layout'>,</span><span class='hs-varid'>ol</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-55"></a> <span class='hs-layout'>(</span><span class='hs-varid'>matchAll</span> <span class='hs-varid'>regex</span> <span class='hs-varid'>source</span><span class='hs-layout'>)</span> <a name="line-56"></a> <a name="line-57"></a><a name="compile"></a><span class='hs-definition'>compile</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>CompOption</span> <span class='hs-comment'>-- ^ Flags (summed together)</span> <a name="line-58"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>ExecOption</span> <span class='hs-comment'>-- ^ Flags (summed together)</span> <a name="line-59"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span> <span class='hs-comment'>-- ^ The regular expression to compile</span> <a name="line-60"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Either</span> <span class='hs-conid'>String</span> <span class='hs-conid'>Regex</span> <span class='hs-comment'>-- ^ Returns: the compiled regular expression</span> <a name="line-61"></a><span class='hs-definition'>compile</span> <span class='hs-varid'>compOpt</span> <span class='hs-varid'>execOpt</span> <span class='hs-varid'>bs</span> <span class='hs-keyglyph'>=</span> <a name="line-62"></a> <span class='hs-keyword'>case</span> <span class='hs-varid'>parseRegex</span> <span class='hs-layout'>(</span><span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-varid'>unpack</span> <span class='hs-varid'>bs</span><span class='hs-layout'>)</span> <span class='hs-keyword'>of</span> <a name="line-63"></a> <span class='hs-conid'>Left</span> <span class='hs-varid'>err</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Left</span> <span class='hs-layout'>(</span><span 
class='hs-str'>"parseRegex for Text.Regex.TDFA.ByteString failed:"</span><span class='hs-varop'>++</span><span class='hs-varid'>show</span> <span class='hs-varid'>err</span><span class='hs-layout'>)</span> <a name="line-64"></a> <span class='hs-conid'>Right</span> <span class='hs-varid'>pattern</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Right</span> <span class='hs-layout'>(</span><span class='hs-varid'>patternToRegex</span> <span class='hs-varid'>pattern</span> <span class='hs-varid'>compOpt</span> <span class='hs-varid'>execOpt</span><span class='hs-layout'>)</span> <a name="line-65"></a> <a name="line-66"></a><a name="execute"></a><span class='hs-definition'>execute</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Regex</span> <span class='hs-comment'>-- ^ Compiled regular expression</span> <a name="line-67"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span> <span class='hs-comment'>-- ^ ByteString to match against</span> <a name="line-68"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Either</span> <span class='hs-conid'>String</span> <span class='hs-layout'>(</span><span class='hs-conid'>Maybe</span> <span class='hs-conid'>MatchArray</span><span class='hs-layout'>)</span> <a name="line-69"></a><span class='hs-definition'>execute</span> <span class='hs-varid'>r</span> <span class='hs-varid'>bs</span> <span class='hs-keyglyph'>=</span> <span class='hs-conid'>Right</span> <span class='hs-layout'>(</span><span class='hs-varid'>matchOnce</span> <span class='hs-varid'>r</span> <span class='hs-varid'>bs</span><span class='hs-layout'>)</span> <a name="line-70"></a> <a name="line-71"></a><a name="regexec"></a><span class='hs-definition'>regexec</span> <span class='hs-keyglyph'>::</span> <span class='hs-conid'>Regex</span> <span class='hs-comment'>-- ^ Compiled regular expression</span> <a name="line-72"></a> <span 
class='hs-keyglyph'>-></span> <span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span> <span class='hs-comment'>-- ^ ByteString to match against</span> <a name="line-73"></a> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Either</span> <span class='hs-conid'>String</span> <span class='hs-layout'>(</span><span class='hs-conid'>Maybe</span> <span class='hs-layout'>(</span><span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span><span class='hs-layout'>,</span> <span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span><span class='hs-layout'>,</span> <span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span><span class='hs-layout'>,</span> <span class='hs-keyglyph'>[</span><span class='hs-conid'>B</span><span class='hs-varop'>.</span><span class='hs-conid'>ByteString</span><span class='hs-keyglyph'>]</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <a name="line-74"></a><span class='hs-definition'>regexec</span> <span class='hs-varid'>r</span> <span class='hs-varid'>bs</span> <span class='hs-keyglyph'>=</span> <a name="line-75"></a> <span class='hs-keyword'>case</span> <span class='hs-varid'>matchOnceText</span> <span class='hs-varid'>r</span> <span class='hs-varid'>bs</span> <span class='hs-keyword'>of</span> <a name="line-76"></a> <span class='hs-conid'>Nothing</span> <span class='hs-keyglyph'>-></span> <span class='hs-conid'>Right</span> <span class='hs-layout'>(</span><span class='hs-conid'>Nothing</span><span class='hs-layout'>)</span> <a name="line-77"></a> <span class='hs-conid'>Just</span> <span class='hs-layout'>(</span><span class='hs-varid'>pre</span><span class='hs-layout'>,</span><span class='hs-varid'>mt</span><span class='hs-layout'>,</span><span class='hs-varid'>post</span><span class='hs-layout'>)</span> <span class='hs-keyglyph'>-></span> <a 
name="line-78"></a> <span class='hs-keyword'>let</span> <span class='hs-varid'>main</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>fst</span> <span class='hs-layout'>(</span><span class='hs-varid'>mt</span><span class='hs-varop'>!</span><span class='hs-num'>0</span><span class='hs-layout'>)</span> <a name="line-79"></a> <span class='hs-varid'>rest</span> <span class='hs-keyglyph'>=</span> <span class='hs-varid'>map</span> <span class='hs-varid'>fst</span> <span class='hs-layout'>(</span><span class='hs-varid'>tail</span> <span class='hs-layout'>(</span><span class='hs-varid'>elems</span> <span class='hs-varid'>mt</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> <span class='hs-comment'>-- will be []</span> <a name="line-80"></a> <span class='hs-keyword'>in</span> <span class='hs-conid'>Right</span> <span class='hs-layout'>(</span><span class='hs-conid'>Just</span> <span class='hs-layout'>(</span><span class='hs-varid'>pre</span><span class='hs-layout'>,</span><span class='hs-varid'>main</span><span class='hs-layout'>,</span><span class='hs-varid'>post</span><span class='hs-layout'>,</span><span class='hs-varid'>rest</span><span class='hs-layout'>)</span><span class='hs-layout'>)</span> </pre></body> </html>