Sophie

Sophie

distrib > Mageia > 6 > armv5tl > media > core-release > by-pkgid > 3a4e91bde08970529a0aa07935652fe8 > files > 959

icu-doc-58.2-3.mga6.noarch.rpm

<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
<meta name="generator" content="Doxygen 1.8.11"/>
<title>ICU 58.2: ucsdet.h File Reference</title>
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="jquery.js"></script>
<script type="text/javascript" src="dynsections.js"></script>
<link href="doxygen.css" rel="stylesheet" type="text/css" />
</head>
<body>
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
<div id="titlearea">
<table cellspacing="0" cellpadding="0">
 <tbody>
 <tr style="height: 56px;">
  <td id="projectalign" style="padding-left: 0.5em;">
   <div id="projectname">ICU 58.2
   &#160;<span id="projectnumber">58.2</span>
   </div>
  </td>
 </tr>
 </tbody>
</table>
</div>
<!-- end header part -->
<!-- Generated by Doxygen 1.8.11 -->
  <div id="navrow1" class="tabs">
    <ul class="tablist">
      <li><a href="index.html"><span>Main&#160;Page</span></a></li>
      <li><a href="pages.html"><span>Related&#160;Pages</span></a></li>
      <li><a href="modules.html"><span>Modules</span></a></li>
      <li><a href="namespaces.html"><span>Namespaces</span></a></li>
      <li><a href="annotated.html"><span>Data&#160;Structures</span></a></li>
      <li class="current"><a href="files.html"><span>Files</span></a></li>
    </ul>
  </div>
  <div id="navrow2" class="tabs2">
    <ul class="tablist">
      <li><a href="files.html"><span>File&#160;List</span></a></li>
      <li><a href="globals.html"><span>Globals</span></a></li>
    </ul>
  </div>
<div id="nav-path" class="navpath">
  <ul>
<li class="navelem"><a class="el" href="dir_b2f33c71d4aa5e7af42a1ca61ff5af1b.html">source</a></li><li class="navelem"><a class="el" href="dir_3c42bef9a3e7804b3d74ebb2809ebf86.html">i18n</a></li><li class="navelem"><a class="el" href="dir_fa4147b4d9cbc9ae7619e21b25239322.html">unicode</a></li>  </ul>
</div>
</div><!-- top -->
<div class="header">
  <div class="summary">
<a href="#namespaces">Namespaces</a> &#124;
<a href="#typedef-members">Typedefs</a> &#124;
<a href="#func-members">Functions</a>  </div>
  <div class="headertitle">
<div class="title">ucsdet.h File Reference</div>  </div>
</div><!--header-->
<div class="contents">

<p>C API: Charset Detection API.  
<a href="#details">More...</a></p>
<div class="textblock"><code>#include &quot;<a class="el" href="utypes_8h_source.html">unicode/utypes.h</a>&quot;</code><br />
<code>#include &quot;<a class="el" href="localpointer_8h_source.html">unicode/localpointer.h</a>&quot;</code><br />
<code>#include &quot;<a class="el" href="uenum_8h_source.html">unicode/uenum.h</a>&quot;</code><br />
</div>
<p><a href="ucsdet_8h_source.html">Go to the source code of this file.</a></p>
<table class="memberdecls">
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="namespaces"></a>
Namespaces</h2></td></tr>
<tr class="memitem:namespaceicu"><td class="memItemLeft" align="right" valign="top"> &#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="namespaceicu.html">icu</a></td></tr>
<tr class="memdesc:namespaceicu"><td class="mdescLeft">&#160;</td><td class="mdescRight">File <a class="el" href="coll_8h.html" title="C++ API: Collation Service. ">coll.h</a>. <br /></td></tr>
<tr class="separator:"><td class="memSeparator" colspan="2">&#160;</td></tr>
</table><table class="memberdecls">
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="typedef-members"></a>
Typedefs</h2></td></tr>
<tr class="memitem:a8f341f9c43bf58b112afd70c8a94c45d"><td class="memItemLeft" align="right" valign="top">typedef struct <a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a>&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a></td></tr>
<tr class="memdesc:a8f341f9c43bf58b112afd70c8a94c45d"><td class="mdescLeft">&#160;</td><td class="mdescRight">Structure representing a charset detector.  <a href="#a8f341f9c43bf58b112afd70c8a94c45d">More...</a><br /></td></tr>
<tr class="separator:a8f341f9c43bf58b112afd70c8a94c45d"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a4e40a6a6dae057f9257e144fc65ba667"><td class="memItemLeft" align="right" valign="top">typedef struct <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a>&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a></td></tr>
<tr class="memdesc:a4e40a6a6dae057f9257e144fc65ba667"><td class="mdescLeft">&#160;</td><td class="mdescRight">Opaque structure representing a match that was identified from a charset detection operation.  <a href="#a4e40a6a6dae057f9257e144fc65ba667">More...</a><br /></td></tr>
<tr class="separator:a4e40a6a6dae057f9257e144fc65ba667"><td class="memSeparator" colspan="2">&#160;</td></tr>
</table><table class="memberdecls">
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="func-members"></a>
Functions</h2></td></tr>
<tr class="memitem:abf2d3c7b731982895433cfbeb6c29cdd"><td class="memItemLeft" align="right" valign="top"><a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#abf2d3c7b731982895433cfbeb6c29cdd">ucsdet_open</a> (<a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:abf2d3c7b731982895433cfbeb6c29cdd"><td class="mdescLeft">&#160;</td><td class="mdescRight">Open a charset detector.  <a href="#abf2d3c7b731982895433cfbeb6c29cdd">More...</a><br /></td></tr>
<tr class="separator:abf2d3c7b731982895433cfbeb6c29cdd"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a84dab4d2c56fedb624a01db170ba698c"><td class="memItemLeft" align="right" valign="top">void&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a84dab4d2c56fedb624a01db170ba698c">ucsdet_close</a> (<a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *ucsd)</td></tr>
<tr class="memdesc:a84dab4d2c56fedb624a01db170ba698c"><td class="mdescLeft">&#160;</td><td class="mdescRight">Close a charset detector.  <a href="#a84dab4d2c56fedb624a01db170ba698c">More...</a><br /></td></tr>
<tr class="separator:a84dab4d2c56fedb624a01db170ba698c"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:abb128d8c30fd92d47110a3ca3499c5b2"><td class="memItemLeft" align="right" valign="top">void&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#abb128d8c30fd92d47110a3ca3499c5b2">ucsdet_setText</a> (<a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *ucsd, const char *textIn, int32_t len, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:abb128d8c30fd92d47110a3ca3499c5b2"><td class="mdescLeft">&#160;</td><td class="mdescRight">Set the input byte data whose charset is to be detected.  <a href="#abb128d8c30fd92d47110a3ca3499c5b2">More...</a><br /></td></tr>
<tr class="separator:abb128d8c30fd92d47110a3ca3499c5b2"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a94e2837151f289f01977a211c8a8e06f"><td class="memItemLeft" align="right" valign="top">void&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a94e2837151f289f01977a211c8a8e06f">ucsdet_setDeclaredEncoding</a> (<a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *ucsd, const char *encoding, int32_t length, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:a94e2837151f289f01977a211c8a8e06f"><td class="mdescLeft">&#160;</td><td class="mdescRight">Set the declared encoding for charset detection.  <a href="#a94e2837151f289f01977a211c8a8e06f">More...</a><br /></td></tr>
<tr class="separator:a94e2837151f289f01977a211c8a8e06f"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:aff2633b5055d472cff4108d94f97cf7d"><td class="memItemLeft" align="right" valign="top">const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> *&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#aff2633b5055d472cff4108d94f97cf7d">ucsdet_detect</a> (<a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *ucsd, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:aff2633b5055d472cff4108d94f97cf7d"><td class="mdescLeft">&#160;</td><td class="mdescRight">Return the charset that best matches the supplied input data.  <a href="#aff2633b5055d472cff4108d94f97cf7d">More...</a><br /></td></tr>
<tr class="separator:aff2633b5055d472cff4108d94f97cf7d"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a307dfacd517a92891d1f98d513429bda"><td class="memItemLeft" align="right" valign="top">const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> **&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a307dfacd517a92891d1f98d513429bda">ucsdet_detectAll</a> (<a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *ucsd, int32_t *matchesFound, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:a307dfacd517a92891d1f98d513429bda"><td class="mdescLeft">&#160;</td><td class="mdescRight">Find all charset matches that appear to be consistent with the input, returning an array of results.  <a href="#a307dfacd517a92891d1f98d513429bda">More...</a><br /></td></tr>
<tr class="separator:a307dfacd517a92891d1f98d513429bda"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:ab9433e14dbe7704a4cf9b2b2f1a7377b"><td class="memItemLeft" align="right" valign="top">const char *&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#ab9433e14dbe7704a4cf9b2b2f1a7377b">ucsdet_getName</a> (const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> *ucsm, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:ab9433e14dbe7704a4cf9b2b2f1a7377b"><td class="mdescLeft">&#160;</td><td class="mdescRight">Get the name of the charset represented by a UCharsetMatch.  <a href="#ab9433e14dbe7704a4cf9b2b2f1a7377b">More...</a><br /></td></tr>
<tr class="separator:ab9433e14dbe7704a4cf9b2b2f1a7377b"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:aa1dd7ce8c727d855697aac1f35df71ed"><td class="memItemLeft" align="right" valign="top">int32_t&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#aa1dd7ce8c727d855697aac1f35df71ed">ucsdet_getConfidence</a> (const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> *ucsm, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:aa1dd7ce8c727d855697aac1f35df71ed"><td class="mdescLeft">&#160;</td><td class="mdescRight">Get a confidence number for the quality of the match of the byte data with the charset.  <a href="#aa1dd7ce8c727d855697aac1f35df71ed">More...</a><br /></td></tr>
<tr class="separator:aa1dd7ce8c727d855697aac1f35df71ed"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a54b1e448b1d9cce1ac017962aaa801aa"><td class="memItemLeft" align="right" valign="top">const char *&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a54b1e448b1d9cce1ac017962aaa801aa">ucsdet_getLanguage</a> (const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> *ucsm, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:a54b1e448b1d9cce1ac017962aaa801aa"><td class="mdescLeft">&#160;</td><td class="mdescRight">Get the RFC 3066 code for the language of the input data.  <a href="#a54b1e448b1d9cce1ac017962aaa801aa">More...</a><br /></td></tr>
<tr class="separator:a54b1e448b1d9cce1ac017962aaa801aa"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a30fd9ddb4090bd730caa49c22a3880e1"><td class="memItemLeft" align="right" valign="top">int32_t&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a30fd9ddb4090bd730caa49c22a3880e1">ucsdet_getUChars</a> (const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> *ucsm, <a class="el" href="umachine_8h.html#a6bb9fad572d65b305324ef288165e2ac">UChar</a> *buf, int32_t cap, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:a30fd9ddb4090bd730caa49c22a3880e1"><td class="mdescLeft">&#160;</td><td class="mdescRight">Get the entire input text as a UChar string, placing it into a caller-supplied buffer.  <a href="#a30fd9ddb4090bd730caa49c22a3880e1">More...</a><br /></td></tr>
<tr class="separator:a30fd9ddb4090bd730caa49c22a3880e1"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a60dcfd7a2b826b995c86becf2f802016"><td class="memItemLeft" align="right" valign="top"><a class="el" href="uenum_8h.html#a32b7253b2148022535be36a9fcdb5a8d">UEnumeration</a> *&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a60dcfd7a2b826b995c86becf2f802016">ucsdet_getAllDetectableCharsets</a> (const <a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *ucsd, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:a60dcfd7a2b826b995c86becf2f802016"><td class="mdescLeft">&#160;</td><td class="mdescRight">Get an iterator over the set of all detectable charsets - over the charsets that are known to the charset detection service.  <a href="#a60dcfd7a2b826b995c86becf2f802016">More...</a><br /></td></tr>
<tr class="separator:a60dcfd7a2b826b995c86becf2f802016"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a04e3e10583476b1b53a677ebb5acfe67"><td class="memItemLeft" align="right" valign="top"><a class="el" href="umachine_8h.html#a349ef00011f20ccd1d3b424445681aa5">UBool</a>&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a04e3e10583476b1b53a677ebb5acfe67">ucsdet_isInputFilterEnabled</a> (const <a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *ucsd)</td></tr>
<tr class="memdesc:a04e3e10583476b1b53a677ebb5acfe67"><td class="mdescLeft">&#160;</td><td class="mdescRight">Test whether input filtering is enabled for this charset detector.  <a href="#a04e3e10583476b1b53a677ebb5acfe67">More...</a><br /></td></tr>
<tr class="separator:a04e3e10583476b1b53a677ebb5acfe67"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:ad4911fca8b4685bba2c1b77ea2d2b535"><td class="memItemLeft" align="right" valign="top"><a class="el" href="umachine_8h.html#a349ef00011f20ccd1d3b424445681aa5">UBool</a>&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#ad4911fca8b4685bba2c1b77ea2d2b535">ucsdet_enableInputFilter</a> (<a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *ucsd, <a class="el" href="umachine_8h.html#a349ef00011f20ccd1d3b424445681aa5">UBool</a> filter)</td></tr>
<tr class="memdesc:ad4911fca8b4685bba2c1b77ea2d2b535"><td class="mdescLeft">&#160;</td><td class="mdescRight">Enable filtering of input text.  <a href="#ad4911fca8b4685bba2c1b77ea2d2b535">More...</a><br /></td></tr>
<tr class="separator:ad4911fca8b4685bba2c1b77ea2d2b535"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a6675b4b134d4a466ccd404de5b786d54"><td class="memItemLeft" align="right" valign="top"><a class="el" href="uenum_8h.html#a32b7253b2148022535be36a9fcdb5a8d">UEnumeration</a> *&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a6675b4b134d4a466ccd404de5b786d54">ucsdet_getDetectableCharsets</a> (const <a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *ucsd, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:a6675b4b134d4a466ccd404de5b786d54"><td class="mdescLeft">&#160;</td><td class="mdescRight">Get an iterator over the set of detectable charsets - over the charsets that are enabled by the specified charset detector.  <a href="#a6675b4b134d4a466ccd404de5b786d54">More...</a><br /></td></tr>
<tr class="separator:a6675b4b134d4a466ccd404de5b786d54"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a8320689559aa9f530a8d44b6a0988ffe"><td class="memItemLeft" align="right" valign="top">void&#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="ucsdet_8h.html#a8320689559aa9f530a8d44b6a0988ffe">ucsdet_setDetectableCharset</a> (<a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *ucsd, const char *encoding, <a class="el" href="umachine_8h.html#a349ef00011f20ccd1d3b424445681aa5">UBool</a> enabled, <a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *status)</td></tr>
<tr class="memdesc:a8320689559aa9f530a8d44b6a0988ffe"><td class="mdescLeft">&#160;</td><td class="mdescRight">Enable or disable individual charset encoding.  <a href="#a8320689559aa9f530a8d44b6a0988ffe">More...</a><br /></td></tr>
<tr class="separator:a8320689559aa9f530a8d44b6a0988ffe"><td class="memSeparator" colspan="2">&#160;</td></tr>
</table>
<a name="details" id="details"></a><h2 class="groupheader">Detailed Description</h2>
<div class="textblock"><p>C API: Charset Detection API. </p>
<p>This API provides a facility for detecting the charset or encoding of character data in an unknown text format. The input data can be from an array of bytes. </p>
<p>Character set detection is at best an imprecise operation. The detection process will attempt to identify the charset that best matches the characteristics of the byte data, but the process is partly statistical in nature, and the results can not be guaranteed to always be correct. </p>
<p>For best accuracy in charset detection, the input data should be primarily in a single language, and a minimum of a few hundred bytes worth of plain text in the language are needed. The detection process will attempt to ignore html or xml style markup that could otherwise obscure the content. </p>

<p>Definition in file <a class="el" href="ucsdet_8h_source.html">ucsdet.h</a>.</p>
</div><h2 class="groupheader">Typedef Documentation</h2>
<a class="anchor" id="a8f341f9c43bf58b112afd70c8a94c45d"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">typedef struct <a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> <a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Structure representing a charset detector. </p>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable004999">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

<p>Definition at line <a class="el" href="ucsdet_8h_source.html#l00056">56</a> of file <a class="el" href="ucsdet_8h_source.html">ucsdet.h</a>.</p>

</div>
</div>
<a class="anchor" id="a4e40a6a6dae057f9257e144fc65ba667"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">typedef struct <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Opaque structure representing a match that was identified from a charset detection operation. </p>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005000">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

<p>Definition at line <a class="el" href="ucsdet_8h_source.html#l00064">64</a> of file <a class="el" href="ucsdet_8h_source.html">ucsdet.h</a>.</p>

</div>
</div>
<h2 class="groupheader">Function Documentation</h2>
<a class="anchor" id="a84dab4d2c56fedb624a01db170ba698c"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">void ucsdet_close </td>
          <td>(</td>
          <td class="paramtype"><a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td>
          <td class="paramname"><em>ucsd</em></td><td>)</td>
          <td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Close a charset detector. </p>
<p>All storage and any other resources owned by this charset detector will be released. Failure to close a charset detector when finished with it can result in memory leaks in the application.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsd</td><td>The charset detector to be closed. </td></tr>
  </table>
  </dd>
</dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005002">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="aff2633b5055d472cff4108d94f97cf7d"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a>* ucsdet_detect </td>
          <td>(</td>
          <td class="paramtype"><a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td>
          <td class="paramname"><em>ucsd</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Return the charset that best matches the supplied input data. </p>
<p>Note though, that because the detection only looks at the start of the input data, there is a possibility that the returned charset will fail to handle the full set of input data. </p>
<p>The returned UCharsetMatch object is owned by the UCharsetDetector. It will remain valid until the detector input is reset, or until the detector is closed. </p>
<p>The function will fail if </p><ul>
<li>
no charset appears to match the data. </li>
<li>
no input text has been provided </li>
</ul>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsd</td><td>the charset detector to be used. </td></tr>
    <tr><td class="paramname">status</td><td>any error conditions are reported back in this variable. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>a UCharsetMatch representing the best matching charset, or NULL if no charset matches the byte data.</dd></dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005005">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="a307dfacd517a92891d1f98d513429bda"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a>** ucsdet_detectAll </td>
          <td>(</td>
          <td class="paramtype"><a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td>
          <td class="paramname"><em>ucsd</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype">int32_t *&#160;</td>
          <td class="paramname"><em>matchesFound</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Find all charset matches that appear to be consistent with the input, returning an array of results. </p>
<p>The results are ordered with the best quality match first.</p>
<p>Because the detection only looks at a limited amount of the input byte data, some of the returned charsets may fail to handle all of the input data. </p>
<p>The returned UCharsetMatch objects are owned by the UCharsetDetector. They will remain valid until the detector is closed or modified.</p>
<p>Return an error if </p><ul>
<li>
no charsets appear to match the input data. </li>
<li>
no input text has been provided </li>
</ul>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsd</td><td>the charset detector to be used. </td></tr>
    <tr><td class="paramname">matchesFound</td><td>pointer to a variable that will be set to the number of charsets identified that are consistent with the input data. Output only. </td></tr>
    <tr><td class="paramname">status</td><td>any error conditions are reported back in this variable. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>A pointer to an array of pointers to UCharsetMatch objects. This array, and the UCharsetMatch instances to which it refers, are owned by the UCharsetDetector, and will remain valid until the detector is closed or modified. </dd></dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005006">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="ad4911fca8b4685bba2c1b77ea2d2b535"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname"><a class="el" href="umachine_8h.html#a349ef00011f20ccd1d3b424445681aa5">UBool</a> ucsdet_enableInputFilter </td>
          <td>(</td>
          <td class="paramtype"><a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td>
          <td class="paramname"><em>ucsd</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="umachine_8h.html#a349ef00011f20ccd1d3b424445681aa5">UBool</a>&#160;</td>
          <td class="paramname"><em>filter</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Enable filtering of input text. </p>
<p>If filtering is enabled, text within angle brackets ("&lt;" and "&gt;") will be removed before detection, which will remove most HTML or XML markup.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsd</td><td>the charset detector to be modified. </td></tr>
    <tr><td class="paramname">filter</td><td><code>true</code> to enable input text filtering. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>The previous setting.</dd></dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005013">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="a60dcfd7a2b826b995c86becf2f802016"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname"><a class="el" href="uenum_8h.html#a32b7253b2148022535be36a9fcdb5a8d">UEnumeration</a>* ucsdet_getAllDetectableCharsets </td>
          <td>(</td>
          <td class="paramtype">const <a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td>
          <td class="paramname"><em>ucsd</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Get an iterator over the set of all detectable charsets - over the charsets that are known to the charset detection service. </p>
<p>The returned UEnumeration provides access to the names of the charsets.</p>
<p>The state of the Charset detector that is passed in does not affect the result of this function, but requiring a valid, open charset detector as a parameter ensures that the charset detection service has been safely initialized and that the required detection data is available.</p>
<p><b>Note:</b> Multiple different charset encodings in the same family may use a single shared name in this implementation. For example, this method returns an array including "ISO-8859-1" (ISO Latin 1), but not including "windows-1252" (Windows Latin 1). However, the actual detection result could be "windows-1252" when the input data matches Latin 1 code points with any points only available in "windows-1252".</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsd</td><td>a Charset detector. </td></tr>
    <tr><td class="paramname">status</td><td>Any error conditions are reported back in this variable. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>an iterator providing access to the detectable charset names. </dd></dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005011">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="aa1dd7ce8c727d855697aac1f35df71ed"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">int32_t ucsdet_getConfidence </td>
          <td>(</td>
          <td class="paramtype">const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> *&#160;</td>
          <td class="paramname"><em>ucsm</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Get a confidence number for the quality of the match of the byte data with the charset. </p>
<p>Confidence numbers range from zero to 100, with 100 representing complete confidence and zero representing no confidence.</p>
<p>The confidence values are somewhat arbitrary. They define an ordering within the results for any single detection operation but are not generally comparable between the results for different input.</p>
<p>A confidence value of ten does have a general meaning - it is used for charsets that can represent the input data, but for which there is no other indication that suggests that the charset is the correct one. Pure 7 bit ASCII data, for example, is compatible with a great many charsets, most of which will appear as possible matches with a confidence of 10.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsm</td><td>The charset match object. </td></tr>
    <tr><td class="paramname">status</td><td>Any error conditions are reported back in this variable. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>A confidence number for the charset match.</dd></dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005008">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="a6675b4b134d4a466ccd404de5b786d54"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname"><a class="el" href="uenum_8h.html#a32b7253b2148022535be36a9fcdb5a8d">UEnumeration</a>* ucsdet_getDetectableCharsets </td>
          <td>(</td>
          <td class="paramtype">const <a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td>
          <td class="paramname"><em>ucsd</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Get an iterator over the set of detectable charsets - over the charsets that are enabled by the specified charset detector. </p>
<p>The returned UEnumeration provides access to the names of the charsets.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsd</td><td>a Charset detector. </td></tr>
    <tr><td class="paramname">status</td><td>Any error conditions are reported back in this variable. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>an iterator providing access to the names of the charsets detectable by the specified charset detector. </dd></dl>
<dl class="internal"><dt><b><a class="el" href="internal.html#_internal000470">Internal:</a></b></dt><dd>Do not use. This API is for internal use only. </dd></dl>

</div>
</div>
<a class="anchor" id="a54b1e448b1d9cce1ac017962aaa801aa"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">const char* ucsdet_getLanguage </td>
          <td>(</td>
          <td class="paramtype">const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> *&#160;</td>
          <td class="paramname"><em>ucsm</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Get the RFC 3066 code for the language of the input data. </p>
<p>The Charset Detection service is intended primarily for detecting charsets, not language. For some, but not all, charsets, a language is identified as a byproduct of the detection process, and that is what is returned by this function.</p>
<p>CAUTION:</p><ol type="1">
<li>Language information is not available for input data encoded in all charsets. In particular, no language is identified for UTF-8 input data.</li>
<li>Closely related languages may sometimes be confused.</li>
</ol>
<p>If more accurate language detection is required, a linguistic analysis package should be used.</p>
<p>The storage for the returned name string is owned by the UCharsetMatch, and will remain valid while the UCharsetMatch is valid.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsm</td><td>The charset match object. </td></tr>
    <tr><td class="paramname">status</td><td>Any error conditions are reported back in this variable. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>The RFC 3066 code for the language of the input data, or an empty string if the language could not be determined.</dd></dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005009">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="ab9433e14dbe7704a4cf9b2b2f1a7377b"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">const char* ucsdet_getName </td>
          <td>(</td>
          <td class="paramtype">const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> *&#160;</td>
          <td class="paramname"><em>ucsm</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Get the name of the charset represented by a UCharsetMatch. </p>
<p>The storage for the returned name string is owned by the UCharsetMatch, and will remain valid while the UCharsetMatch is valid.</p>
<p>The name returned is suitable for use with the ICU conversion APIs.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsm</td><td>The charset match object. </td></tr>
    <tr><td class="paramname">status</td><td>Any error conditions are reported back in this variable. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>The name of the matching charset.</dd></dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005007">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="a30fd9ddb4090bd730caa49c22a3880e1"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">int32_t ucsdet_getUChars </td>
          <td>(</td>
          <td class="paramtype">const <a class="el" href="ucsdet_8h.html#a4e40a6a6dae057f9257e144fc65ba667">UCharsetMatch</a> *&#160;</td>
          <td class="paramname"><em>ucsm</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="umachine_8h.html#a6bb9fad572d65b305324ef288165e2ac">UChar</a> *&#160;</td>
          <td class="paramname"><em>buf</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype">int32_t&#160;</td>
          <td class="paramname"><em>cap</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Get the entire input text as a UChar string, placing it into a caller-supplied buffer. </p>
<p>A terminating NUL character will be appended to the buffer if space is available.</p>
<p>The number of UChars in the output string, not including the terminating NUL, is returned.</p>
<p>If the supplied buffer is smaller than required to hold the output, the contents of the buffer are undefined. The full output string length (in UChars) is returned as always, and can be used to allocate a buffer of the correct size.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsm</td><td>The charset match object. </td></tr>
    <tr><td class="paramname">buf</td><td>A UChar buffer to be filled with the converted text data. </td></tr>
    <tr><td class="paramname">cap</td><td>The capacity of the buffer in UChars. </td></tr>
    <tr><td class="paramname">status</td><td>Any error conditions are reported back in this variable. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>The number of UChars in the output string.</dd></dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005010">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="a04e3e10583476b1b53a677ebb5acfe67"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname"><a class="el" href="umachine_8h.html#a349ef00011f20ccd1d3b424445681aa5">UBool</a> ucsdet_isInputFilterEnabled </td>
          <td>(</td>
          <td class="paramtype">const <a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td>
          <td class="paramname"><em>ucsd</em></td><td>)</td>
          <td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Test whether input filtering is enabled for this charset detector. </p>
<p>Input filtering removes text that appears to be HTML or XML markup from the input before applying the code page detection heuristics.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsd</td><td>The charset detector to check. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>TRUE if filtering is enabled. </dd></dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005012">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="abf2d3c7b731982895433cfbeb6c29cdd"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname"><a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a>* ucsdet_open </td>
          <td>(</td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em></td><td>)</td>
          <td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Open a charset detector. </p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">status</td><td>Any error conditions occurring during the open operation are reported back in this variable. </td></tr>
  </table>
  </dd>
</dl>
<dl class="section return"><dt>Returns</dt><dd>the newly opened charset detector. </dd></dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005001">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="a94e2837151f289f01977a211c8a8e06f"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">void ucsdet_setDeclaredEncoding </td>
          <td>(</td>
          <td class="paramtype"><a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td>
          <td class="paramname"><em>ucsd</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype">const char *&#160;</td>
          <td class="paramname"><em>encoding</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype">int32_t&#160;</td>
          <td class="paramname"><em>length</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Set the declared encoding for charset detection. </p>
<p>The declared encoding of an input text is an encoding obtained by the user from an HTTP header or XML declaration or similar source that can be provided as an additional hint to the charset detector.</p>
<p>How and whether the declared encoding will be used during the detection process is TBD.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsd</td><td>the charset detector to be used. </td></tr>
    <tr><td class="paramname">encoding</td><td>an encoding for the current data obtained from a header or declaration or other source outside of the byte data itself. </td></tr>
    <tr><td class="paramname">length</td><td>the length of the encoding name, or -1 if the name string is NUL terminated. </td></tr>
    <tr><td class="paramname">status</td><td>any error conditions are reported back in this variable.</td></tr>
  </table>
  </dd>
</dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005004">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
<a class="anchor" id="a8320689559aa9f530a8d44b6a0988ffe"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">void ucsdet_setDetectableCharset </td>
          <td>(</td>
          <td class="paramtype"><a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td>
          <td class="paramname"><em>ucsd</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype">const char *&#160;</td>
          <td class="paramname"><em>encoding</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="umachine_8h.html#a349ef00011f20ccd1d3b424445681aa5">UBool</a>&#160;</td>
          <td class="paramname"><em>enabled</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Enable or disable an individual charset encoding. </p>
<p>The name of the charset encoding must be one of the names returned by <code>ucsdet_getAllDetectableCharsets()</code>.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsd</td><td>a Charset detector. </td></tr>
    <tr><td class="paramname">encoding</td><td>the name of the charset encoding. </td></tr>
    <tr><td class="paramname">enabled</td><td><code>TRUE</code> to enable, or <code>FALSE</code> to disable the charset encoding. </td></tr>
    <tr><td class="paramname">status</td><td>receives the return status. When the name of charset encoding is not supported, U_ILLEGAL_ARGUMENT_ERROR is set. </td></tr>
  </table>
  </dd>
</dl>
<dl class="internal"><dt><b><a class="el" href="internal.html#_internal000471">Internal:</a></b></dt><dd>Do not use. This API is for internal use only. </dd></dl>

</div>
</div>
<a class="anchor" id="abb128d8c30fd92d47110a3ca3499c5b2"></a>
<div class="memitem">
<div class="memproto">
      <table class="memname">
        <tr>
          <td class="memname">void ucsdet_setText </td>
          <td>(</td>
          <td class="paramtype"><a class="el" href="ucsdet_8h.html#a8f341f9c43bf58b112afd70c8a94c45d">UCharsetDetector</a> *&#160;</td>
          <td class="paramname"><em>ucsd</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype">const char *&#160;</td>
          <td class="paramname"><em>textIn</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype">int32_t&#160;</td>
          <td class="paramname"><em>len</em>, </td>
        </tr>
        <tr>
          <td class="paramkey"></td>
          <td></td>
          <td class="paramtype"><a class="el" href="utypes_8h.html#a3343c1c8a8377277046774691c98d78c">UErrorCode</a> *&#160;</td>
          <td class="paramname"><em>status</em>&#160;</td>
        </tr>
        <tr>
          <td></td>
          <td>)</td>
          <td></td><td></td>
        </tr>
      </table>
</div><div class="memdoc">

<p>Set the input byte data whose charset is to be detected. </p>
<p>Ownership of the input text byte array remains with the caller. The input string must not be altered or deleted until the charset detector is either closed or reset to refer to different input text.</p>
<dl class="params"><dt>Parameters</dt><dd>
  <table class="params">
    <tr><td class="paramname">ucsd</td><td>the charset detector to be used. </td></tr>
    <tr><td class="paramname">textIn</td><td>the input text of unknown encoding. </td></tr>
    <tr><td class="paramname">len</td><td>the length of the input text, or -1 if the text is NUL terminated. </td></tr>
    <tr><td class="paramname">status</td><td>any error conditions are reported back in this variable.</td></tr>
  </table>
  </dd>
</dl>
<dl class="stable"><dt><b><a class="el" href="stable.html#_stable005003">Stable:</a></b></dt><dd>ICU 3.6 </dd></dl>

</div>
</div>
</div><!-- contents -->
<!-- start footer part -->
<hr class="footer"/><address class="footer"><small>
Generated by &#160;<a href="http://www.doxygen.org/index.html">
<img class="footer" src="doxygen.png" alt="doxygen"/>
</a> 1.8.11
</small></address>
</body>
</html>