This file is indexed.

/usr/share/opencc/doc/html/_u_t_f8_util_8hpp_source.html is in libopencc2-data 1.0.4-5.

This file is owned by root:root, with mode 0o644.

The actual contents of the file can be viewed below.

 1
 2
 3
 4
 5
 6
 7
 8
 9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<!-- Character encoding declaration. "text/xhtml" is not a registered media type;
     the XHTML 1.0 HTML-compatibility form of this pragma uses "text/html". -->
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
<meta name="generator" content="Doxygen 1.8.13"/>
<meta name="viewport" content="width=device-width, initial-scale=1"/>
<title>Open Chinese Convert: UTF8Util.hpp Source File</title>
<!-- Stylesheets and scripts are kept in their original order; later files
     presumably rely on earlier ones (e.g. jquery.js first) - TODO confirm before reordering. -->
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="jquery.js"></script>
<script type="text/javascript" src="dynsections.js"></script>
<link href="search/search.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="search/searchdata.js"></script>
<script type="text/javascript" src="search/search.js"></script>
<link href="doxygen.css" rel="stylesheet" type="text/css" />
</head>
<body>
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
<!-- Title area: project name, version number and one-line project description,
     laid out in a single-cell table. -->
<div id="titlearea">
<table cellspacing="0" cellpadding="0">
 <tbody>
 <tr style="height: 56px;">
  <td id="projectalign" style="padding-left: 0.5em;">
   <!-- The numeric entity on the second line below is a non-breaking space
        placed between the project name and its version number. -->
   <div id="projectname">Open Chinese Convert
   &#160;<span id="projectnumber">1.0.4</span>
   </div>
   <div id="projectbrief">A project for conversion between Traditional and Simplified Chinese</div>
  </td>
 </tr>
 </tbody>
</table>
</div>
<!-- end header part -->
<!-- Generated by Doxygen 1.8.13 -->
<script type="text/javascript">
/* Global search box object; the inline event handlers on #MSearchSelectWindow
   further down the page call its methods through this variable name. */
var searchBox = new SearchBox('searchBox', 'search', false, 'Search');
</script>
<script type="text/javascript" src="menudata.js"></script>
<script type="text/javascript" src="menu.js"></script>
<script type="text/javascript">
/* When the DOM is ready, call initMenu() and then queue init_search()
   through a second ready callback, as the original did. */
$(document).ready(function () {
  initMenu('', true, false, 'search.php', 'Search');
  $(function () { init_search(); });
});
</script>
<!-- Empty placeholder element for the main navigation; presumably filled in
     by script (see the initMenu() call above) - TODO confirm. -->
<div id="main-nav"></div>
<!-- window showing the filter options.
     The inline handlers below forward mouse-over, mouse-out and key-down events
     to the global searchBox object and return that method's result. -->
<div id="MSearchSelectWindow"
     onmouseover="return searchBox.OnSearchSelectShow()"
     onmouseout="return searchBox.OnSearchSelectHide()"
     onkeydown="return searchBox.OnSearchSelectKey(event)">
</div>

<!-- iframe showing the search results (closed by default).
     The title attribute gives the frame an accessible name so assistive
     technology can announce what the frame contains. -->
<div id="MSearchResultsWindow">
<iframe src="javascript:void(0)" frameborder="0"
        name="MSearchResults" id="MSearchResults"
        title="Search results">
</iframe>
</div>

<!-- Navigation path: a one-entry list whose only item is a link labelled "src" -->
<div id="nav-path" class="navpath">
  <ul>
    <li class="navelem"><a class="el" href="dir_68267d1309a1af8e8297ef4c3efbcdba.html">src</a></li>
  </ul>
</div>
</div><!-- top -->
<!-- Page heading showing the file name UTF8Util.hpp -->
<div class="header">
  <div class="headertitle">
    <div class="title">UTF8Util.hpp</div>
  </div>
</div><!--header-->
<div class="contents">
<div class="fragment"><div class="line"><a name="l00001"></a><span class="lineno">    1</span>&#160;<span class="comment">/*</span></div><div class="line"><a name="l00002"></a><span class="lineno">    2</span>&#160;<span class="comment"> * Open Chinese Convert</span></div><div class="line"><a name="l00003"></a><span class="lineno">    3</span>&#160;<span class="comment"> *</span></div><div class="line"><a name="l00004"></a><span class="lineno">    4</span>&#160;<span class="comment"> * Copyright 2013 BYVoid &lt;byvoid@byvoid.com&gt;</span></div><div class="line"><a name="l00005"></a><span class="lineno">    5</span>&#160;<span class="comment"> *</span></div><div class="line"><a name="l00006"></a><span class="lineno">    6</span>&#160;<span class="comment"> * Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);</span></div><div class="line"><a name="l00007"></a><span class="lineno">    7</span>&#160;<span class="comment"> * you may not use this file except in compliance with the License.</span></div><div class="line"><a name="l00008"></a><span class="lineno">    8</span>&#160;<span class="comment"> * You may obtain a copy of the License at</span></div><div class="line"><a name="l00009"></a><span class="lineno">    9</span>&#160;<span class="comment"> *</span></div><div class="line"><a name="l00010"></a><span class="lineno">   10</span>&#160;<span class="comment"> *      http://www.apache.org/licenses/LICENSE-2.0</span></div><div class="line"><a name="l00011"></a><span class="lineno">   11</span>&#160;<span class="comment"> *</span></div><div class="line"><a name="l00012"></a><span class="lineno">   12</span>&#160;<span class="comment"> * Unless required by applicable law or agreed to in writing, software</span></div><div class="line"><a name="l00013"></a><span class="lineno">   13</span>&#160;<span class="comment"> * distributed under the License is distributed on an &quot;AS IS&quot; BASIS,</span></div><div class="line"><a 
name="l00014"></a><span class="lineno">   14</span>&#160;<span class="comment"> * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</span></div><div class="line"><a name="l00015"></a><span class="lineno">   15</span>&#160;<span class="comment"> * See the License for the specific language governing permissions and</span></div><div class="line"><a name="l00016"></a><span class="lineno">   16</span>&#160;<span class="comment"> * limitations under the License.</span></div><div class="line"><a name="l00017"></a><span class="lineno">   17</span>&#160;<span class="comment"> */</span></div><div class="line"><a name="l00018"></a><span class="lineno">   18</span>&#160;</div><div class="line"><a name="l00019"></a><span class="lineno">   19</span>&#160;<span class="preprocessor">#pragma once</span></div><div class="line"><a name="l00020"></a><span class="lineno">   20</span>&#160;</div><div class="line"><a name="l00021"></a><span class="lineno">   21</span>&#160;<span class="preprocessor">#ifdef _MSC_VER</span></div><div class="line"><a name="l00022"></a><span class="lineno">   22</span>&#160;<span class="preprocessor">#define NOMINMAX</span></div><div class="line"><a name="l00023"></a><span class="lineno">   23</span>&#160;<span class="preprocessor">#include &lt;Windows.h&gt;</span></div><div class="line"><a name="l00024"></a><span class="lineno">   24</span>&#160;<span class="preprocessor">#undef NOMINMAX</span></div><div class="line"><a name="l00025"></a><span class="lineno">   25</span>&#160;<span class="preprocessor">#endif // _MSC_VER</span></div><div class="line"><a name="l00026"></a><span class="lineno">   26</span>&#160;</div><div class="line"><a name="l00027"></a><span class="lineno">   27</span>&#160;<span class="preprocessor">#include &quot;Common.hpp&quot;</span></div><div class="line"><a name="l00028"></a><span class="lineno">   28</span>&#160;</div><div class="line"><a name="l00029"></a><span class="lineno">   29</span>&#160;<span 
class="keyword">namespace </span><a class="code" href="namespaceopencc.html">opencc</a> {</div><div class="line"><a name="l00034"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html">   34</a></span>&#160;<span class="keyword">class </span>OPENCC_EXPORT <a class="code" href="classopencc_1_1_u_t_f8_util.html">UTF8Util</a> {</div><div class="line"><a name="l00035"></a><span class="lineno">   35</span>&#160;<span class="keyword">public</span>:</div><div class="line"><a name="l00039"></a><span class="lineno">   39</span>&#160;  <span class="keyword">static</span> <span class="keywordtype">void</span> SkipUtf8Bom(FILE* fp);</div><div class="line"><a name="l00040"></a><span class="lineno">   40</span>&#160;</div><div class="line"><a name="l00045"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#a7741e8ca4c6ad9e4f68b9d4633b58def">   45</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">size_t</span> <a class="code" href="classopencc_1_1_u_t_f8_util.html#a7741e8ca4c6ad9e4f68b9d4633b58def">NextCharLengthNoException</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* str) {</div><div class="line"><a name="l00046"></a><span class="lineno">   46</span>&#160;    <span class="keywordtype">char</span> ch = *str;</div><div class="line"><a name="l00047"></a><span class="lineno">   47</span>&#160;    <span class="keywordflow">if</span> ((ch &amp; 0xF0) == 0xE0) {</div><div class="line"><a name="l00048"></a><span class="lineno">   48</span>&#160;      <span class="keywordflow">return</span> 3;</div><div class="line"><a name="l00049"></a><span class="lineno">   49</span>&#160;    } <span class="keywordflow">else</span> <span class="keywordflow">if</span> ((ch &amp; 0x80) == 0x00) {</div><div class="line"><a name="l00050"></a><span class="lineno">   50</span>&#160;      <span class="keywordflow">return</span> 1;</div><div class="line"><a name="l00051"></a><span 
class="lineno">   51</span>&#160;    } <span class="keywordflow">else</span> <span class="keywordflow">if</span> ((ch &amp; 0xE0) == 0xC0) {</div><div class="line"><a name="l00052"></a><span class="lineno">   52</span>&#160;      <span class="keywordflow">return</span> 2;</div><div class="line"><a name="l00053"></a><span class="lineno">   53</span>&#160;    } <span class="keywordflow">else</span> <span class="keywordflow">if</span> ((ch &amp; 0xF8) == 0xF0) {</div><div class="line"><a name="l00054"></a><span class="lineno">   54</span>&#160;      <span class="keywordflow">return</span> 4;</div><div class="line"><a name="l00055"></a><span class="lineno">   55</span>&#160;    } <span class="keywordflow">else</span> <span class="keywordflow">if</span> ((ch &amp; 0xFC) == 0xF8) {</div><div class="line"><a name="l00056"></a><span class="lineno">   56</span>&#160;      <span class="keywordflow">return</span> 5;</div><div class="line"><a name="l00057"></a><span class="lineno">   57</span>&#160;    } <span class="keywordflow">else</span> <span class="keywordflow">if</span> ((ch &amp; 0xFE) == 0xFC) {</div><div class="line"><a name="l00058"></a><span class="lineno">   58</span>&#160;      <span class="keywordflow">return</span> 6;</div><div class="line"><a name="l00059"></a><span class="lineno">   59</span>&#160;    }</div><div class="line"><a name="l00060"></a><span class="lineno">   60</span>&#160;    <span class="keywordflow">return</span> 0;</div><div class="line"><a name="l00061"></a><span class="lineno">   61</span>&#160;  }</div><div class="line"><a name="l00062"></a><span class="lineno">   62</span>&#160;</div><div class="line"><a name="l00066"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#ae71013ee7dfef2aba9e99dbae8f24bbd">   66</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">size_t</span> <a class="code" 
href="classopencc_1_1_u_t_f8_util.html#ae71013ee7dfef2aba9e99dbae8f24bbd">NextCharLength</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* str) {</div><div class="line"><a name="l00067"></a><span class="lineno">   67</span>&#160;    <span class="keywordtype">size_t</span> length = NextCharLengthNoException(str);</div><div class="line"><a name="l00068"></a><span class="lineno">   68</span>&#160;    <span class="keywordflow">if</span> (length == 0) {</div><div class="line"><a name="l00069"></a><span class="lineno">   69</span>&#160;      <span class="keywordflow">throw</span> <a class="code" href="classopencc_1_1_invalid_u_t_f8.html">InvalidUTF8</a>(str);</div><div class="line"><a name="l00070"></a><span class="lineno">   70</span>&#160;    }</div><div class="line"><a name="l00071"></a><span class="lineno">   71</span>&#160;    <span class="keywordflow">return</span> length;</div><div class="line"><a name="l00072"></a><span class="lineno">   72</span>&#160;  }</div><div class="line"><a name="l00073"></a><span class="lineno">   73</span>&#160;</div><div class="line"><a name="l00077"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#a153a270ce21d855c07a7d5eba397da5e">   77</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">size_t</span> <a class="code" href="classopencc_1_1_u_t_f8_util.html#a153a270ce21d855c07a7d5eba397da5e">PrevCharLength</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* str) {</div><div class="line"><a name="l00078"></a><span class="lineno">   78</span>&#160;    {</div><div class="line"><a name="l00079"></a><span class="lineno">   79</span>&#160;      <span class="keyword">const</span> <span class="keywordtype">size_t</span> length = NextCharLengthNoException(str - 3);</div><div class="line"><a name="l00080"></a><span class="lineno">   80</span>&#160;      <span class="keywordflow">if</span> (length == 3) {</div><div class="line"><a 
name="l00081"></a><span class="lineno">   81</span>&#160;        <span class="keywordflow">return</span> length;</div><div class="line"><a name="l00082"></a><span class="lineno">   82</span>&#160;      }</div><div class="line"><a name="l00083"></a><span class="lineno">   83</span>&#160;    }</div><div class="line"><a name="l00084"></a><span class="lineno">   84</span>&#160;    {</div><div class="line"><a name="l00085"></a><span class="lineno">   85</span>&#160;      <span class="keyword">const</span> <span class="keywordtype">size_t</span> length = NextCharLengthNoException(str - 1);</div><div class="line"><a name="l00086"></a><span class="lineno">   86</span>&#160;      <span class="keywordflow">if</span> (length == 1) {</div><div class="line"><a name="l00087"></a><span class="lineno">   87</span>&#160;        <span class="keywordflow">return</span> length;</div><div class="line"><a name="l00088"></a><span class="lineno">   88</span>&#160;      }</div><div class="line"><a name="l00089"></a><span class="lineno">   89</span>&#160;    }</div><div class="line"><a name="l00090"></a><span class="lineno">   90</span>&#160;    {</div><div class="line"><a name="l00091"></a><span class="lineno">   91</span>&#160;      <span class="keyword">const</span> <span class="keywordtype">size_t</span> length = NextCharLengthNoException(str - 2);</div><div class="line"><a name="l00092"></a><span class="lineno">   92</span>&#160;      <span class="keywordflow">if</span> (length == 2) {</div><div class="line"><a name="l00093"></a><span class="lineno">   93</span>&#160;        <span class="keywordflow">return</span> length;</div><div class="line"><a name="l00094"></a><span class="lineno">   94</span>&#160;      }</div><div class="line"><a name="l00095"></a><span class="lineno">   95</span>&#160;    }</div><div class="line"><a name="l00096"></a><span class="lineno">   96</span>&#160;    <span class="keywordflow">for</span> (<span class="keywordtype">size_t</span> i = 4; i &lt;= 6; i++) 
{</div><div class="line"><a name="l00097"></a><span class="lineno">   97</span>&#160;      <span class="keyword">const</span> <span class="keywordtype">size_t</span> length = NextCharLengthNoException(str - i);</div><div class="line"><a name="l00098"></a><span class="lineno">   98</span>&#160;      <span class="keywordflow">if</span> (length == i) {</div><div class="line"><a name="l00099"></a><span class="lineno">   99</span>&#160;        <span class="keywordflow">return</span> length;</div><div class="line"><a name="l00100"></a><span class="lineno">  100</span>&#160;      }</div><div class="line"><a name="l00101"></a><span class="lineno">  101</span>&#160;    }</div><div class="line"><a name="l00102"></a><span class="lineno">  102</span>&#160;    <span class="keywordflow">throw</span> <a class="code" href="classopencc_1_1_invalid_u_t_f8.html">InvalidUTF8</a>(str);</div><div class="line"><a name="l00103"></a><span class="lineno">  103</span>&#160;  }</div><div class="line"><a name="l00104"></a><span class="lineno">  104</span>&#160;</div><div class="line"><a name="l00108"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#ae26e05a30598021e204448ea71971208">  108</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* <a class="code" href="classopencc_1_1_u_t_f8_util.html#ae26e05a30598021e204448ea71971208">NextChar</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* str) {</div><div class="line"><a name="l00109"></a><span class="lineno">  109</span>&#160;    <span class="keywordflow">return</span> str + NextCharLength(str);</div><div class="line"><a name="l00110"></a><span class="lineno">  110</span>&#160;  }</div><div class="line"><a name="l00111"></a><span class="lineno">  111</span>&#160;</div><div class="line"><a name="l00115"></a><span class="lineno"><a class="line" 
href="classopencc_1_1_u_t_f8_util.html#ab6031f3d1a95f66c51a142d5c2794614">  115</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* <a class="code" href="classopencc_1_1_u_t_f8_util.html#ab6031f3d1a95f66c51a142d5c2794614">PrevChar</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* str) {</div><div class="line"><a name="l00116"></a><span class="lineno">  116</span>&#160;    <span class="keywordflow">return</span> str - PrevCharLength(str);</div><div class="line"><a name="l00117"></a><span class="lineno">  117</span>&#160;  }</div><div class="line"><a name="l00118"></a><span class="lineno">  118</span>&#160;</div><div class="line"><a name="l00122"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#ac0642244a71d77d3e79829a7952f9b86">  122</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">size_t</span> <a class="code" href="classopencc_1_1_u_t_f8_util.html#ac0642244a71d77d3e79829a7952f9b86">Length</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* str) {</div><div class="line"><a name="l00123"></a><span class="lineno">  123</span>&#160;    <span class="keywordtype">size_t</span> length = 0;</div><div class="line"><a name="l00124"></a><span class="lineno">  124</span>&#160;    <span class="keywordflow">while</span> (*str != <span class="charliteral">&#39;\0&#39;</span>) {</div><div class="line"><a name="l00125"></a><span class="lineno">  125</span>&#160;      str = NextChar(str);</div><div class="line"><a name="l00126"></a><span class="lineno">  126</span>&#160;      length++;</div><div class="line"><a name="l00127"></a><span class="lineno">  127</span>&#160;    }</div><div class="line"><a name="l00128"></a><span class="lineno">  128</span>&#160;    <span class="keywordflow">return</span> length;</div><div class="line"><a name="l00129"></a><span class="lineno">  129</span>&#160;  
}</div><div class="line"><a name="l00130"></a><span class="lineno">  130</span>&#160;</div><div class="line"><a name="l00137"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#a3c9791916dd617caa7eef44a67900c20">  137</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* <a class="code" href="classopencc_1_1_u_t_f8_util.html#a3c9791916dd617caa7eef44a67900c20">FindNextInline</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* str, <span class="keyword">const</span> <span class="keywordtype">char</span> ch) {</div><div class="line"><a name="l00138"></a><span class="lineno">  138</span>&#160;    <span class="keywordflow">while</span> (!IsLineEndingOrFileEnding(*str) &amp;&amp; *str != ch) {</div><div class="line"><a name="l00139"></a><span class="lineno">  139</span>&#160;      str = NextChar(str);</div><div class="line"><a name="l00140"></a><span class="lineno">  140</span>&#160;    }</div><div class="line"><a name="l00141"></a><span class="lineno">  141</span>&#160;    <span class="keywordflow">return</span> str;</div><div class="line"><a name="l00142"></a><span class="lineno">  142</span>&#160;  }</div><div class="line"><a name="l00143"></a><span class="lineno">  143</span>&#160;</div><div class="line"><a name="l00147"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#a008b85311545f43a7a3c14e304004266">  147</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">bool</span> <a class="code" href="classopencc_1_1_u_t_f8_util.html#a008b85311545f43a7a3c14e304004266">IsLineEndingOrFileEnding</a>(<span class="keyword">const</span> <span class="keywordtype">char</span> ch) {</div><div class="line"><a name="l00148"></a><span class="lineno">  148</span>&#160;    <span class="keywordflow">return</span> ch == <span class="charliteral">&#39;\0&#39;</span> || ch == <span 
class="charliteral">&#39;\n&#39;</span> || ch == <span class="charliteral">&#39;\r&#39;</span>;</div><div class="line"><a name="l00149"></a><span class="lineno">  149</span>&#160;  }</div><div class="line"><a name="l00150"></a><span class="lineno">  150</span>&#160;</div><div class="line"><a name="l00154"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#afefc07b662cd10ebe998685e2ce3b72d">  154</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">string</span> <a class="code" href="classopencc_1_1_u_t_f8_util.html#afefc07b662cd10ebe998685e2ce3b72d">FromSubstr</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* str, <span class="keywordtype">size_t</span> length) {</div><div class="line"><a name="l00155"></a><span class="lineno">  155</span>&#160;    <span class="keywordtype">string</span> newStr;</div><div class="line"><a name="l00156"></a><span class="lineno">  156</span>&#160;    newStr.resize(length);</div><div class="line"><a name="l00157"></a><span class="lineno">  157</span>&#160;    strncpy(const_cast&lt;char*&gt;(newStr.c_str()), str, length);</div><div class="line"><a name="l00158"></a><span class="lineno">  158</span>&#160;    <span class="keywordflow">return</span> newStr;</div><div class="line"><a name="l00159"></a><span class="lineno">  159</span>&#160;  }</div><div class="line"><a name="l00160"></a><span class="lineno">  160</span>&#160;</div><div class="line"><a name="l00164"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#a8ee1ac13118c59a357114782d18a3497">  164</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">bool</span> <a class="code" href="classopencc_1_1_u_t_f8_util.html#a8ee1ac13118c59a357114782d18a3497">NotShorterThan</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* str, <span class="keywordtype">size_t</span> byteLength) {</div><div class="line"><a 
name="l00165"></a><span class="lineno">  165</span>&#160;    <span class="keywordflow">while</span> (byteLength &gt; 0) {</div><div class="line"><a name="l00166"></a><span class="lineno">  166</span>&#160;      <span class="keywordflow">if</span> (*str == <span class="charliteral">&#39;\0&#39;</span>) {</div><div class="line"><a name="l00167"></a><span class="lineno">  167</span>&#160;        <span class="keywordflow">return</span> <span class="keyword">false</span>;</div><div class="line"><a name="l00168"></a><span class="lineno">  168</span>&#160;      }</div><div class="line"><a name="l00169"></a><span class="lineno">  169</span>&#160;      byteLength--;</div><div class="line"><a name="l00170"></a><span class="lineno">  170</span>&#160;      str++;</div><div class="line"><a name="l00171"></a><span class="lineno">  171</span>&#160;    }</div><div class="line"><a name="l00172"></a><span class="lineno">  172</span>&#160;    <span class="keywordflow">return</span> <span class="keyword">true</span>;</div><div class="line"><a name="l00173"></a><span class="lineno">  173</span>&#160;  }</div><div class="line"><a name="l00174"></a><span class="lineno">  174</span>&#160;</div><div class="line"><a name="l00179"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#ae212d8ca540b33752e2ff373f842479c">  179</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">string</span> <a class="code" href="classopencc_1_1_u_t_f8_util.html#ae212d8ca540b33752e2ff373f842479c">TruncateUTF8</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* str, <span class="keywordtype">size_t</span> maxByteLength) {</div><div class="line"><a name="l00180"></a><span class="lineno">  180</span>&#160;    <span class="keywordtype">string</span> wordTrunc;</div><div class="line"><a name="l00181"></a><span class="lineno">  181</span>&#160;    <span class="keywordflow">if</span> (NotShorterThan(str, maxByteLength)) {</div><div 
class="line"><a name="l00182"></a><span class="lineno">  182</span>&#160;      <span class="keywordtype">size_t</span> len = 0;</div><div class="line"><a name="l00183"></a><span class="lineno">  183</span>&#160;      <span class="keyword">const</span> <span class="keywordtype">char</span>* pStr = str;</div><div class="line"><a name="l00184"></a><span class="lineno">  184</span>&#160;      <span class="keywordflow">for</span> (;;) {</div><div class="line"><a name="l00185"></a><span class="lineno">  185</span>&#160;        <span class="keyword">const</span> <span class="keywordtype">size_t</span> charLength = NextCharLength(pStr);</div><div class="line"><a name="l00186"></a><span class="lineno">  186</span>&#160;        <span class="keywordflow">if</span> (len + charLength &gt; maxByteLength) {</div><div class="line"><a name="l00187"></a><span class="lineno">  187</span>&#160;          <span class="keywordflow">break</span>;</div><div class="line"><a name="l00188"></a><span class="lineno">  188</span>&#160;        }</div><div class="line"><a name="l00189"></a><span class="lineno">  189</span>&#160;        pStr += charLength;</div><div class="line"><a name="l00190"></a><span class="lineno">  190</span>&#160;        len += charLength;</div><div class="line"><a name="l00191"></a><span class="lineno">  191</span>&#160;      }</div><div class="line"><a name="l00192"></a><span class="lineno">  192</span>&#160;      wordTrunc = FromSubstr(str, len);</div><div class="line"><a name="l00193"></a><span class="lineno">  193</span>&#160;    } <span class="keywordflow">else</span> {</div><div class="line"><a name="l00194"></a><span class="lineno">  194</span>&#160;      wordTrunc = str;</div><div class="line"><a name="l00195"></a><span class="lineno">  195</span>&#160;    }</div><div class="line"><a name="l00196"></a><span class="lineno">  196</span>&#160;    <span class="keywordflow">return</span> wordTrunc;</div><div class="line"><a name="l00197"></a><span class="lineno">  
197</span>&#160;  }</div><div class="line"><a name="l00198"></a><span class="lineno">  198</span>&#160;</div><div class="line"><a name="l00202"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#af2cf133ab5574e3267a8726a5b766a9d">  202</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">void</span> <a class="code" href="classopencc_1_1_u_t_f8_util.html#af2cf133ab5574e3267a8726a5b766a9d">ReplaceAll</a>(<span class="keywordtype">string</span>&amp; str, <span class="keyword">const</span> <span class="keywordtype">char</span>* from, <span class="keyword">const</span> <span class="keywordtype">char</span>* to) {</div><div class="line"><a name="l00203"></a><span class="lineno">  203</span>&#160;    string::size_type pos = 0;</div><div class="line"><a name="l00204"></a><span class="lineno">  204</span>&#160;    string::size_type fromLen = strlen(from);</div><div class="line"><a name="l00205"></a><span class="lineno">  205</span>&#160;    string::size_type toLen = strlen(to);</div><div class="line"><a name="l00206"></a><span class="lineno">  206</span>&#160;    <span class="keywordflow">while</span> ((pos = str.find(from, pos)) != string::npos) {</div><div class="line"><a name="l00207"></a><span class="lineno">  207</span>&#160;      str.replace(pos, fromLen, to);</div><div class="line"><a name="l00208"></a><span class="lineno">  208</span>&#160;      pos += toLen;</div><div class="line"><a name="l00209"></a><span class="lineno">  209</span>&#160;    }</div><div class="line"><a name="l00210"></a><span class="lineno">  210</span>&#160;  }</div><div class="line"><a name="l00211"></a><span class="lineno">  211</span>&#160;</div><div class="line"><a name="l00215"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#ac2c522f4bc20ea7b08a921fb8380c9e7">  215</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">string</span> <a class="code" 
href="classopencc_1_1_u_t_f8_util.html#ac2c522f4bc20ea7b08a921fb8380c9e7">Join</a>(<span class="keyword">const</span> vector&lt;string&gt;&amp; strings, <span class="keyword">const</span> <span class="keywordtype">string</span>&amp; separator) {</div><div class="line"><a name="l00216"></a><span class="lineno">  216</span>&#160;    std::ostringstream buffer;</div><div class="line"><a name="l00217"></a><span class="lineno">  217</span>&#160;    <span class="keywordtype">bool</span> first = <span class="keyword">true</span>;</div><div class="line"><a name="l00218"></a><span class="lineno">  218</span>&#160;    <span class="keywordflow">for</span> (<span class="keyword">const</span> <span class="keyword">auto</span>&amp; str : strings) {</div><div class="line"><a name="l00219"></a><span class="lineno">  219</span>&#160;      <span class="keywordflow">if</span> (!first) {</div><div class="line"><a name="l00220"></a><span class="lineno">  220</span>&#160;        buffer &lt;&lt; separator;</div><div class="line"><a name="l00221"></a><span class="lineno">  221</span>&#160;      }</div><div class="line"><a name="l00222"></a><span class="lineno">  222</span>&#160;      buffer &lt;&lt; str;</div><div class="line"><a name="l00223"></a><span class="lineno">  223</span>&#160;      first = <span class="keyword">false</span>;</div><div class="line"><a name="l00224"></a><span class="lineno">  224</span>&#160;    }</div><div class="line"><a name="l00225"></a><span class="lineno">  225</span>&#160;    <span class="keywordflow">return</span> buffer.str();</div><div class="line"><a name="l00226"></a><span class="lineno">  226</span>&#160;  }</div><div class="line"><a name="l00227"></a><span class="lineno">  227</span>&#160;</div><div class="line"><a name="l00231"></a><span class="lineno"><a class="line" href="classopencc_1_1_u_t_f8_util.html#aec5b28619d5a84d13abcc193f6f2bcc4">  231</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">string</span> <a 
class="code" href="classopencc_1_1_u_t_f8_util.html#aec5b28619d5a84d13abcc193f6f2bcc4">Join</a>(<span class="keyword">const</span> vector&lt;string&gt;&amp; strings) {</div><div class="line"><a name="l00232"></a><span class="lineno">  232</span>&#160;    std::ostringstream buffer;</div><div class="line"><a name="l00233"></a><span class="lineno">  233</span>&#160;    <span class="keywordflow">for</span> (<span class="keyword">const</span> <span class="keyword">auto</span>&amp; str : strings) {</div><div class="line"><a name="l00234"></a><span class="lineno">  234</span>&#160;      buffer &lt;&lt; str;</div><div class="line"><a name="l00235"></a><span class="lineno">  235</span>&#160;    }</div><div class="line"><a name="l00236"></a><span class="lineno">  236</span>&#160;    <span class="keywordflow">return</span> buffer.str();</div><div class="line"><a name="l00237"></a><span class="lineno">  237</span>&#160;  }</div><div class="line"><a name="l00238"></a><span class="lineno">  238</span>&#160;</div><div class="line"><a name="l00239"></a><span class="lineno">  239</span>&#160;  <span class="keyword">static</span> <span class="keywordtype">void</span> GetByteMap(<span class="keyword">const</span> <span class="keywordtype">char</span>* str, <span class="keyword">const</span> <span class="keywordtype">size_t</span> utf8Length,</div><div class="line"><a name="l00240"></a><span class="lineno">  240</span>&#160;                         vector&lt;size_t&gt;* byteMap) {</div><div class="line"><a name="l00241"></a><span class="lineno">  241</span>&#160;    <span class="keywordflow">if</span> (byteMap-&gt;size() &lt; utf8Length) {</div><div class="line"><a name="l00242"></a><span class="lineno">  242</span>&#160;      byteMap-&gt;resize(utf8Length);</div><div class="line"><a name="l00243"></a><span class="lineno">  243</span>&#160;    }</div><div class="line"><a name="l00244"></a><span class="lineno">  244</span>&#160;    <span class="keyword">const</span> <span 
class="keywordtype">char</span>* pstr = str;</div><div class="line"><a name="l00245"></a><span class="lineno">  245</span>&#160;    <span class="keywordflow">for</span> (<span class="keywordtype">size_t</span> i = 0; i &lt; utf8Length; i++) {</div><div class="line"><a name="l00246"></a><span class="lineno">  246</span>&#160;      (*byteMap)[i] = pstr - str;</div><div class="line"><a name="l00247"></a><span class="lineno">  247</span>&#160;      pstr = NextChar(pstr);</div><div class="line"><a name="l00248"></a><span class="lineno">  248</span>&#160;    }</div><div class="line"><a name="l00249"></a><span class="lineno">  249</span>&#160;  }</div><div class="line"><a name="l00250"></a><span class="lineno">  250</span>&#160;</div><div class="line"><a name="l00251"></a><span class="lineno">  251</span>&#160;<span class="preprocessor">#ifdef _MSC_VER</span></div><div class="line"><a name="l00252"></a><span class="lineno">  252</span>&#160;  <span class="keyword">static</span> std::wstring GetPlatformString(<span class="keyword">const</span> std::string&amp; str) {</div><div class="line"><a name="l00253"></a><span class="lineno">  253</span>&#160;    <span class="keywordflow">return</span> U8ToU16(str);</div><div class="line"><a name="l00254"></a><span class="lineno">  254</span>&#160;  }</div><div class="line"><a name="l00255"></a><span class="lineno">  255</span>&#160;<span class="preprocessor">#else</span></div><div class="line"><a name="l00256"></a><span class="lineno">  256</span>&#160;  <span class="keyword">static</span> std::string GetPlatformString(<span class="keyword">const</span> std::string&amp; str) {</div><div class="line"><a name="l00257"></a><span class="lineno">  257</span>&#160;    <span class="keywordflow">return</span> str;</div><div class="line"><a name="l00258"></a><span class="lineno">  258</span>&#160;  }</div><div class="line"><a name="l00259"></a><span class="lineno">  259</span>&#160;<span class="preprocessor">#endif // 
_MSC_VER</span></div><div class="line"><a name="l00260"></a><span class="lineno">  260</span>&#160;</div><div class="line"><a name="l00261"></a><span class="lineno">  261</span>&#160;</div><div class="line"><a name="l00262"></a><span class="lineno">  262</span>&#160;<span class="preprocessor">#ifdef _MSC_VER</span></div><div class="line"><a name="l00263"></a><span class="lineno">  263</span>&#160;  <span class="keyword">static</span> std::string U16ToU8(<span class="keyword">const</span> std::wstring&amp; wstr) {</div><div class="line"><a name="l00264"></a><span class="lineno">  264</span>&#160;    std::string ret;</div><div class="line"><a name="l00265"></a><span class="lineno">  265</span>&#160;    <span class="keywordtype">int</span> convcnt = WideCharToMultiByte(CP_UTF8, 0, wstr.c_str(), wstr.length(), NULL, 0, NULL, NULL);</div><div class="line"><a name="l00266"></a><span class="lineno">  266</span>&#160;    <span class="keywordflow">if</span> (convcnt &gt; 0) {</div><div class="line"><a name="l00267"></a><span class="lineno">  267</span>&#160;      ret.resize(convcnt);</div><div class="line"><a name="l00268"></a><span class="lineno">  268</span>&#160;      WideCharToMultiByte(CP_UTF8, 0, wstr.c_str(), wstr.length(), &amp;ret[0], convcnt, NULL, NULL);</div><div class="line"><a name="l00269"></a><span class="lineno">  269</span>&#160;    }</div><div class="line"><a name="l00270"></a><span class="lineno">  270</span>&#160;    <span class="keywordflow">return</span> ret;</div><div class="line"><a name="l00271"></a><span class="lineno">  271</span>&#160;  }</div><div class="line"><a name="l00272"></a><span class="lineno">  272</span>&#160;</div><div class="line"><a name="l00273"></a><span class="lineno">  273</span>&#160;  <span class="keyword">static</span> std::wstring U8ToU16(<span class="keyword">const</span> std::string&amp; str) {</div><div class="line"><a name="l00274"></a><span class="lineno">  274</span>&#160;    std::wstring ret;</div><div 
class="line"><a name="l00275"></a><span class="lineno">  275</span>&#160;    <span class="keywordtype">int</span> convcnt = MultiByteToWideChar(CP_UTF8, 0, str.c_str(), str.length(), NULL, 0);</div><div class="line"><a name="l00276"></a><span class="lineno">  276</span>&#160;    <span class="keywordflow">if</span> (convcnt &gt; 0) {</div><div class="line"><a name="l00277"></a><span class="lineno">  277</span>&#160;      ret.resize(convcnt);</div><div class="line"><a name="l00278"></a><span class="lineno">  278</span>&#160;      MultiByteToWideChar(CP_UTF8, 0, str.c_str(), str.length(), &amp;ret[0], convcnt);</div><div class="line"><a name="l00279"></a><span class="lineno">  279</span>&#160;    }</div><div class="line"><a name="l00280"></a><span class="lineno">  280</span>&#160;    <span class="keywordflow">return</span> ret;</div><div class="line"><a name="l00281"></a><span class="lineno">  281</span>&#160;  }</div><div class="line"><a name="l00282"></a><span class="lineno">  282</span>&#160;<span class="preprocessor">#endif // _MSC_VER</span></div><div class="line"><a name="l00283"></a><span class="lineno">  283</span>&#160;};</div><div class="line"><a name="l00284"></a><span class="lineno">  284</span>&#160;}</div><div class="ttc" id="classopencc_1_1_u_t_f8_util_html_a153a270ce21d855c07a7d5eba397da5e"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#a153a270ce21d855c07a7d5eba397da5e">opencc::UTF8Util::PrevCharLength</a></div><div class="ttdeci">static size_t PrevCharLength(const char *str)</div><div class="ttdoc">Returns the length in byte for the previous UTF8 character. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:77</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_aec5b28619d5a84d13abcc193f6f2bcc4"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#aec5b28619d5a84d13abcc193f6f2bcc4">opencc::UTF8Util::Join</a></div><div class="ttdeci">static string Join(const vector&lt; string &gt; &amp;strings)</div><div class="ttdoc">Joins a string vector into a string. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:231</div></div>
<div class="ttc" id="classopencc_1_1_invalid_u_t_f8_html"><div class="ttname"><a href="classopencc_1_1_invalid_u_t_f8.html">opencc::InvalidUTF8</a></div><div class="ttdef"><b>Definition:</b> Exception.hpp:77</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_ac2c522f4bc20ea7b08a921fb8380c9e7"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#ac2c522f4bc20ea7b08a921fb8380c9e7">opencc::UTF8Util::Join</a></div><div class="ttdeci">static string Join(const vector&lt; string &gt; &amp;strings, const string &amp;separator)</div><div class="ttdoc">Joins a string vector into a string with a separator. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:215</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_ae212d8ca540b33752e2ff373f842479c"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#ae212d8ca540b33752e2ff373f842479c">opencc::UTF8Util::TruncateUTF8</a></div><div class="ttdeci">static string TruncateUTF8(const char *str, size_t maxByteLength)</div><div class="ttdoc">Truncates a string with a maximal length in byte. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:179</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_af2cf133ab5574e3267a8726a5b766a9d"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#af2cf133ab5574e3267a8726a5b766a9d">opencc::UTF8Util::ReplaceAll</a></div><div class="ttdeci">static void ReplaceAll(string &amp;str, const char *from, const char *to)</div><div class="ttdoc">Replaces all patterns in a string in place. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:202</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_afefc07b662cd10ebe998685e2ce3b72d"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#afefc07b662cd10ebe998685e2ce3b72d">opencc::UTF8Util::FromSubstr</a></div><div class="ttdeci">static string FromSubstr(const char *str, size_t length)</div><div class="ttdoc">Copies a substring with given length to a new std::string. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:154</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_a8ee1ac13118c59a357114782d18a3497"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#a8ee1ac13118c59a357114782d18a3497">opencc::UTF8Util::NotShorterThan</a></div><div class="ttdeci">static bool NotShorterThan(const char *str, size_t byteLength)</div><div class="ttdoc">Returns true if the given string is longer or as long as the given length. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:164</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_ac0642244a71d77d3e79829a7952f9b86"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#ac0642244a71d77d3e79829a7952f9b86">opencc::UTF8Util::Length</a></div><div class="ttdeci">static size_t Length(const char *str)</div><div class="ttdoc">Returns the UTF8 length of a valid UTF8 string. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:122</div></div>
<div class="ttc" id="namespaceopencc_html"><div class="ttname"><a href="namespaceopencc.html">opencc</a></div><div class="ttdef"><b>Definition:</b> BinaryDict.hpp:24</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_ab6031f3d1a95f66c51a142d5c2794614"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#ab6031f3d1a95f66c51a142d5c2794614">opencc::UTF8Util::PrevChar</a></div><div class="ttdeci">static const char * PrevChar(const char *str)</div><div class="ttdoc">Move the char* pointer before the previous UTF8 character. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:115</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_ae26e05a30598021e204448ea71971208"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#ae26e05a30598021e204448ea71971208">opencc::UTF8Util::NextChar</a></div><div class="ttdeci">static const char * NextChar(const char *str)</div><div class="ttdoc">Returns the char* pointer over the next UTF8 character. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:108</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html">opencc::UTF8Util</a></div><div class="ttdoc">UTF8 string utilities. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:34</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_a3c9791916dd617caa7eef44a67900c20"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#a3c9791916dd617caa7eef44a67900c20">opencc::UTF8Util::FindNextInline</a></div><div class="ttdeci">static const char * FindNextInline(const char *str, const char ch)</div><div class="ttdoc">Finds a character in the same line. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:137</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_ae71013ee7dfef2aba9e99dbae8f24bbd"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#ae71013ee7dfef2aba9e99dbae8f24bbd">opencc::UTF8Util::NextCharLength</a></div><div class="ttdeci">static size_t NextCharLength(const char *str)</div><div class="ttdoc">Returns the length in byte for the next UTF8 character. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:66</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_a008b85311545f43a7a3c14e304004266"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#a008b85311545f43a7a3c14e304004266">opencc::UTF8Util::IsLineEndingOrFileEnding</a></div><div class="ttdeci">static bool IsLineEndingOrFileEnding(const char ch)</div><div class="ttdoc">Returns true if the character is a line ending or end of file. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:147</div></div>
<div class="ttc" id="classopencc_1_1_u_t_f8_util_html_a7741e8ca4c6ad9e4f68b9d4633b58def"><div class="ttname"><a href="classopencc_1_1_u_t_f8_util.html#a7741e8ca4c6ad9e4f68b9d4633b58def">opencc::UTF8Util::NextCharLengthNoException</a></div><div class="ttdeci">static size_t NextCharLengthNoException(const char *str)</div><div class="ttdoc">Returns the length in byte for the next UTF8 character. </div><div class="ttdef"><b>Definition:</b> UTF8Util.hpp:45</div></div>
</div><!-- fragment --></div><!-- contents -->
<!-- start footer part -->
<hr class="footer"/><address class="footer"><small>
Generated on Fri Jan 20 2017 07:15:35 for Open Chinese Convert by &#160;<a href="http://www.doxygen.org/index.html">
<img class="footer" src="doxygen.png" alt="doxygen"/>
</a> 1.8.13
</small></address>
</body>
</html>