<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
<!-- Generated by HsColour, http://www.cs.york.ac.uk/fp/darcs/hscolour/ -->
<!-- Markup characters inside the listing are entity-escaped (&lt; &gt;) so the page stays well-formed XHTML. -->
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
<title>src/Data/CSV.hs</title>
<link type="text/css" rel="stylesheet" href="hscolour.css" />
</head>
<body>
<!-- One source line per "line-N" anchor; the extra named anchors (eol, cell, ...) mark top-level definitions. -->
<pre><a name="line-1"></a><span class="hs-comment">{- arch-tag: CSV and TSV utilities
<a name="line-2"></a>Copyright (C) 2005 John Goerzen &lt;jgoerzen@complete.org&gt;
<a name="line-3"></a>
<a name="line-4"></a>This program is free software; you can redistribute it and/or modify
<a name="line-5"></a>it under the terms of the GNU General Public License as published by
<a name="line-6"></a>the Free Software Foundation; either version 2 of the License, or
<a name="line-7"></a>(at your option) any later version.
<a name="line-8"></a>
<a name="line-9"></a>This program is distributed in the hope that it will be useful,
<a name="line-10"></a>but WITHOUT ANY WARRANTY; without even the implied warranty of
<a name="line-11"></a>MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
<a name="line-12"></a>GNU General Public License for more details.
<a name="line-13"></a>
<a name="line-14"></a>You should have received a copy of the GNU General Public License
<a name="line-15"></a>along with this program; if not, write to the Free Software
<a name="line-16"></a>Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
<a name="line-17"></a>-}</span>
<a name="line-18"></a>
<a name="line-19"></a><span class="hs-comment">{- |
<a name="line-20"></a>   Module     : Data.CSV
<a name="line-21"></a>   Copyright  : Copyright (C) 2005-2006 John Goerzen
<a name="line-22"></a>   License    : GNU GPL, version 2 or above
<a name="line-23"></a>
<a name="line-24"></a>   Maintainer : John Goerzen &lt;jgoerzen@complete.org&gt;
<a name="line-25"></a>   Stability  : provisional
<a name="line-26"></a>   Portability: portable
<a name="line-27"></a>
<a name="line-28"></a>Haskell Parsec parsers for comma-separated value (CSV) files.
<a name="line-29"></a>
<a name="line-30"></a>Written by John Goerzen, jgoerzen\@complete.org
<a name="line-31"></a>-}</span>
<a name="line-32"></a>
<a name="line-33"></a><span class="hs-keyword">module</span> <span class="hs-conid">Data</span><span class="hs-varop">.</span><span class="hs-conid">CSV</span> <span class="hs-layout">(</span><span class="hs-varid">csvFile</span><span class="hs-layout">,</span> <span class="hs-varid">genCsvFile</span><span class="hs-layout">)</span> <span class="hs-keyword">where</span>
<a name="line-34"></a><span class="hs-keyword">import</span> <span class="hs-conid">Text</span><span class="hs-varop">.</span><span class="hs-conid">ParserCombinators</span><span class="hs-varop">.</span><span class="hs-conid">Parsec</span>
<a name="line-35"></a><span class="hs-keyword">import</span> <span class="hs-conid">Data</span><span class="hs-varop">.</span><span class="hs-conid">List</span> <span class="hs-layout">(</span><span class="hs-varid">intersperse</span><span class="hs-layout">)</span>
<a name="line-36"></a>
<a name="line-37"></a><a name="eol"></a><span class="hs-definition">eol</span> <span class="hs-keyglyph">::</span> <span class="hs-keyword">forall</span> <span class="hs-varid">st</span><span class="hs-varop">.</span> <span class="hs-conid">GenParser</span> <span class="hs-conid">Char</span> <span class="hs-varid">st</span> <span class="hs-conid">String</span>
<a name="line-38"></a><span class="hs-definition">eol</span> <span class="hs-keyglyph">=</span> <span class="hs-layout">(</span><span class="hs-varid">try</span> <span class="hs-varop">$</span> <span class="hs-varid">string</span> <span class="hs-str">"\n\r"</span><span class="hs-layout">)</span> <span class="hs-varop">&lt;|&gt;</span> <span class="hs-layout">(</span><span class="hs-varid">try</span> <span class="hs-varop">$</span> <span class="hs-varid">string</span> <span class="hs-str">"\r\n"</span><span class="hs-layout">)</span> <span class="hs-varop">&lt;|&gt;</span> <span class="hs-varid">string</span> <span class="hs-str">"\n"</span> <span class="hs-varop">&lt;|&gt;</span>
<a name="line-39"></a>      <span class="hs-varid">string</span> <span class="hs-str">"\r"</span> <span class="hs-varop">&lt;?&gt;</span> <span class="hs-str">"End of line"</span>
<a name="line-40"></a>
<a name="line-41"></a><a name="cell"></a><span class="hs-definition">cell</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">GenParser</span> <span class="hs-conid">Char</span> <span class="hs-varid">st</span> <span class="hs-conid">String</span>
<a name="line-42"></a><span class="hs-definition">cell</span> <span class="hs-keyglyph">=</span> <span class="hs-varid">quotedcell</span> <span class="hs-varop">&lt;|&gt;</span> <span class="hs-varid">many</span> <span class="hs-layout">(</span><span class="hs-varid">noneOf</span> <span class="hs-str">",\n\r"</span><span class="hs-layout">)</span>
<a name="line-43"></a>
<a name="line-44"></a><a name="quotedchar"></a><span class="hs-definition">quotedchar</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">GenParser</span> <span class="hs-conid">Char</span> <span class="hs-varid">st</span> <span class="hs-conid">Char</span>
<a name="line-45"></a><span class="hs-definition">quotedchar</span> <span class="hs-keyglyph">=</span> <span class="hs-varid">noneOf</span> <span class="hs-str">"\""</span>
<a name="line-46"></a>             <span class="hs-varop">&lt;|&gt;</span> <span class="hs-layout">(</span><span class="hs-varid">try</span> <span class="hs-varop">$</span> <span class="hs-keyword">do</span> <span class="hs-varid">string</span> <span class="hs-str">"\"\""</span>
<a name="line-47"></a>                           <span class="hs-varid">return</span> <span class="hs-chr">'"'</span>
<a name="line-48"></a>                 <span class="hs-layout">)</span>
<a name="line-49"></a><a name="quotedcell"></a><span class="hs-definition">quotedcell</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">CharParser</span> <span class="hs-varid">st</span> <span class="hs-conid">String</span>
<a name="line-50"></a><span class="hs-definition">quotedcell</span> <span class="hs-keyglyph">=</span> <span class="hs-keyword">do</span> <span class="hs-varid">char</span> <span class="hs-chr">'"'</span>
<a name="line-51"></a>                <span class="hs-varid">content</span> <span class="hs-keyglyph">&lt;-</span> <span class="hs-varid">many</span> <span class="hs-varid">quotedchar</span>
<a name="line-52"></a>                <span class="hs-varid">char</span> <span class="hs-chr">'"'</span>
<a name="line-53"></a>                <span class="hs-varid">return</span> <span class="hs-varid">content</span>
<a name="line-54"></a>
<a name="line-55"></a><a name="line"></a><span class="hs-definition">line</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">GenParser</span> <span class="hs-conid">Char</span> <span class="hs-varid">st</span> <span class="hs-keyglyph">[</span><span class="hs-conid">String</span><span class="hs-keyglyph">]</span>
<a name="line-56"></a><span class="hs-definition">line</span> <span class="hs-keyglyph">=</span> <span class="hs-varid">sepBy</span> <span class="hs-varid">cell</span> <span class="hs-layout">(</span><span class="hs-varid">char</span> <span class="hs-chr">','</span><span class="hs-layout">)</span>
<a name="line-57"></a>
<a name="line-58"></a><span class="hs-comment">{- | Parse a Comma-Separated Value (CSV) file. The return value is a list of
<a name="line-59"></a>lines; each line is a list of cells; and each cell is a String.
<a name="line-60"></a>
<a name="line-61"></a>Please note that CSV files may have a different number of cells on each line.
<a name="line-62"></a>Also, it is impossible to distinguish a CSV line that has a cell with no data
<a name="line-63"></a>from a CSV line that has no cells.
<a name="line-64"></a>
<a name="line-65"></a>Here are some examples:
<a name="line-66"></a>
<a name="line-67"></a>&gt;Input (literal strings)          Parses As (Haskell String syntax)
<a name="line-68"></a>&gt;-------------------------------- ---------------------------------
<a name="line-69"></a>&gt;1,2,3                            [["1", "2", "3"]]
<a name="line-70"></a>&gt;
<a name="line-71"></a>&gt;l1                               [["l1"], ["l2"]]
<a name="line-72"></a>&gt;l2
<a name="line-73"></a>&gt;
<a name="line-74"></a>&gt; (empty line)                    [[""]]
<a name="line-75"></a>&gt;
<a name="line-76"></a>&gt;NQ,"Quoted"                      [["NQ", "Quoted"]]
<a name="line-77"></a>&gt;
<a name="line-78"></a>&gt;NQ,"Embedded""Quote"             [["NQ", "Embedded\"Quote"]]
<a name="line-79"></a>
<a name="line-80"></a>To parse a String, you might use:
<a name="line-81"></a>
<a name="line-82"></a>&gt;import Text.ParserCombinators.Parsec
<a name="line-83"></a>&gt;import Data.CSV
<a name="line-84"></a>&gt;....
<a name="line-85"></a>&gt;parse csvFile "" mystring
<a name="line-86"></a>
<a name="line-87"></a>To parse a file, you might instead use:
<a name="line-88"></a>
<a name="line-89"></a>&gt;do result &lt;- parseFromFile csvFile "/path/to/file"
<a name="line-90"></a>
<a name="line-91"></a>Please note that the result of parsing will be of type
<a name="line-92"></a>(Either ParseError [[String]]). A Left result indicates an error.
<a name="line-93"></a>For more details, see the Parsec information.
<a name="line-94"></a>-}</span>
<a name="line-95"></a>
<a name="line-96"></a><a name="csvFile"></a><span class="hs-definition">csvFile</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">CharParser</span> <span class="hs-varid">st</span> <span class="hs-keyglyph">[</span><span class="hs-keyglyph">[</span><span class="hs-conid">String</span><span class="hs-keyglyph">]</span><span class="hs-keyglyph">]</span>
<a name="line-97"></a><span class="hs-definition">csvFile</span> <span class="hs-keyglyph">=</span> <span class="hs-varid">endBy</span> <span class="hs-varid">line</span> <span class="hs-varid">eol</span>
<a name="line-98"></a>
<a name="line-99"></a><a name="genCsvFile"></a><span class="hs-comment">{- | Generate CSV data for a file. The resulting string can be
<a name="line-100"></a>written out to disk directly. -}</span>
<a name="line-101"></a><span class="hs-definition">genCsvFile</span> <span class="hs-keyglyph">::</span> <span class="hs-keyglyph">[</span><span class="hs-keyglyph">[</span><span class="hs-conid">String</span><span class="hs-keyglyph">]</span><span class="hs-keyglyph">]</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">String</span>
<a name="line-102"></a><span class="hs-definition">genCsvFile</span> <span class="hs-varid">inp</span> <span class="hs-keyglyph">=</span>
<a name="line-103"></a>    <span class="hs-varid">unlines</span> <span class="hs-varop">.</span> <span class="hs-varid">map</span> <span class="hs-varid">csvline</span> <span class="hs-varop">$</span> <span class="hs-varid">inp</span>
<a name="line-104"></a>    <span class="hs-keyword">where</span> <span class="hs-varid">csvline</span> <span class="hs-keyglyph">::</span> <span class="hs-keyglyph">[</span><span class="hs-conid">String</span><span class="hs-keyglyph">]</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">String</span>
<a name="line-105"></a>          <span class="hs-varid">csvline</span> <span class="hs-varid">l</span> <span class="hs-keyglyph">=</span> <span class="hs-varid">concat</span> <span class="hs-varop">.</span> <span class="hs-varid">intersperse</span> <span class="hs-str">","</span> <span class="hs-varop">.</span> <span class="hs-varid">map</span> <span class="hs-varid">csvcells</span> <span class="hs-varop">$</span> <span class="hs-varid">l</span>
<a name="line-106"></a>          <span class="hs-varid">csvcells</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">String</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">String</span>
<a name="line-107"></a>          <span class="hs-varid">csvcells</span> <span class="hs-str">""</span> <span class="hs-keyglyph">=</span> <span class="hs-str">""</span>
<a name="line-108"></a>          <span class="hs-varid">csvcells</span> <span class="hs-varid">c</span> <span class="hs-keyglyph">=</span> <span class="hs-chr">'"'</span> <span class="hs-conop">:</span> <span class="hs-varid">convcell</span> <span class="hs-varid">c</span> <span class="hs-varop">++</span> <span class="hs-str">"\""</span>
<a name="line-109"></a>          <span class="hs-varid">convcell</span> <span class="hs-keyglyph">::</span> <span class="hs-conid">String</span> <span class="hs-keyglyph">-&gt;</span> <span class="hs-conid">String</span>
<a name="line-110"></a>          <span class="hs-varid">convcell</span> <span class="hs-varid">c</span> <span class="hs-keyglyph">=</span> <span class="hs-varid">concatMap</span> <span class="hs-varid">convchar</span> <span class="hs-varid">c</span>
<a name="line-111"></a>          <span class="hs-varid">convchar</span> <span class="hs-chr">'"'</span> <span class="hs-keyglyph">=</span> <span class="hs-str">"\"\""</span>
<a name="line-112"></a>          <span class="hs-varid">convchar</span> <span class="hs-varid">x</span> <span class="hs-keyglyph">=</span> <span class="hs-keyglyph">[</span><span class="hs-varid">x</span><span class="hs-keyglyph">]</span>
</pre>
</body>
</html>