mirror of
https://github.com/boostorg/locale.git
synced 2026-02-26 16:52:26 +00:00
476 lines
50 KiB
HTML
476 lines
50 KiB
HTML
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
|
|
<html xmlns="http://www.w3.org/1999/xhtml">
|
|
<head>
|
|
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
|
|
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
|
|
<title>Boost.Locale: boost/locale/utf.hpp Source File</title>
|
|
|
|
<link href="tabs.css" rel="stylesheet" type="text/css"/>
|
|
<link href="doxygen.css" rel="stylesheet" type="text/css" />
|
|
<link href="navtree.css" rel="stylesheet" type="text/css"/>
|
|
<script type="text/javascript" src="jquery.js"></script>
|
|
<script type="text/javascript" src="resize.js"></script>
|
|
<script type="text/javascript" src="navtree.js"></script>
|
|
<script type="text/javascript">
|
|
$(document).ready(initResizable);
|
|
</script>
|
|
|
|
|
|
</head>
|
|
<body>
|
|
<div id="top"><!-- do not remove this div! -->
|
|
|
|
|
|
<div id="titlearea">
|
|
<table cellspacing="0" cellpadding="0">
|
|
<tbody>
|
|
<tr style="height: 56px;">
|
|
|
|
<td id="projectlogo"><img alt="Logo" src="boost-small.png"/></td>
|
|
|
|
|
|
<td style="padding-left: 0.5em;">
|
|
<div id="projectname">Boost.Locale
|
|
|
|
</div>
|
|
|
|
</td>
|
|
|
|
|
|
|
|
</tr>
|
|
</tbody>
|
|
</table>
|
|
</div>
|
|
|
|
<!-- Generated by Doxygen 1.7.6.1 -->
|
|
<div id="navrow1" class="tabs">
|
|
<ul class="tablist">
|
|
<li><a href="index.html"><span>Main Page</span></a></li>
|
|
<li><a href="modules.html"><span>Modules</span></a></li>
|
|
<li><a href="namespaces.html"><span>Namespaces</span></a></li>
|
|
<li><a href="annotated.html"><span>Classes</span></a></li>
|
|
<li class="current"><a href="files.html"><span>Files</span></a></li>
|
|
<li><a href="examples.html"><span>Examples</span></a></li>
|
|
</ul>
|
|
</div>
|
|
<div id="navrow2" class="tabs2">
|
|
<ul class="tablist">
|
|
<li><a href="files.html"><span>File List</span></a></li>
|
|
</ul>
|
|
</div>
|
|
</div>
|
|
<div id="side-nav" class="ui-resizable side-nav-resizable">
|
|
<div id="nav-tree">
|
|
<div id="nav-tree-contents">
|
|
</div>
|
|
</div>
|
|
<div id="splitbar" style="-moz-user-select:none;"
|
|
class="ui-resizable-handle">
|
|
</div>
|
|
</div>
|
|
<script type="text/javascript">
|
|
initNavTree('utf_8hpp.html','');
|
|
</script>
|
|
<div id="doc-content">
|
|
<div class="header">
|
|
<div class="headertitle">
|
|
<div class="title">boost/locale/utf.hpp</div> </div>
|
|
</div><!--header-->
|
|
<div class="contents">
|
|
<div class="fragment"><pre class="fragment"><a name="l00001"></a>00001 <span class="comment">//</span>
|
|
<a name="l00002"></a>00002 <span class="comment">// Copyright (c) 2009-2011 Artyom Beilis (Tonkikh)</span>
|
|
<a name="l00003"></a>00003 <span class="comment">//</span>
|
|
<a name="l00004"></a>00004 <span class="comment">// Distributed under the Boost Software License, Version 1.0. (See</span>
|
|
<a name="l00005"></a>00005 <span class="comment">// accompanying file LICENSE_1_0.txt or copy at</span>
|
|
<a name="l00006"></a>00006 <span class="comment">// http://www.boost.org/LICENSE_1_0.txt)</span>
|
|
<a name="l00007"></a>00007 <span class="comment">//</span>
|
|
<a name="l00008"></a>00008 <span class="preprocessor">#ifndef BOOST_LOCALE_UTF_HPP_INCLUDED</span>
|
|
<a name="l00009"></a>00009 <span class="preprocessor"></span><span class="preprocessor">#define BOOST_LOCALE_UTF_HPP_INCLUDED</span>
|
|
<a name="l00010"></a>00010 <span class="preprocessor"></span>
|
|
<a name="l00011"></a>00011 <span class="preprocessor">#include <boost/cstdint.hpp></span>
|
|
<a name="l00012"></a>00012
|
|
<a name="l00013"></a>00013 <span class="keyword">namespace </span>boost {
|
|
<a name="l00014"></a>00014 <span class="keyword">namespace </span>locale {
|
|
<a name="l00020"></a><a class="code" href="namespaceboost_1_1locale_1_1utf.html">00020</a> <span class="keyword">namespace </span>utf {
|
|
<a name="l00022"></a>00022 <span class="preprocessor"> #ifdef __GNUC__</span>
|
|
<a name="l00023"></a>00023 <span class="preprocessor"></span><span class="preprocessor"> # define BOOST_LOCALE_LIKELY(x) __builtin_expect((x),1)</span>
|
|
<a name="l00024"></a>00024 <span class="preprocessor"></span><span class="preprocessor"> # define BOOST_LOCALE_UNLIKELY(x) __builtin_expect((x),0)</span>
|
|
<a name="l00025"></a>00025 <span class="preprocessor"></span><span class="preprocessor"> #else</span>
|
|
<a name="l00026"></a>00026 <span class="preprocessor"></span><span class="preprocessor"> # define BOOST_LOCALE_LIKELY(x) (x)</span>
|
|
<a name="l00027"></a>00027 <span class="preprocessor"></span><span class="preprocessor"> # define BOOST_LOCALE_UNLIKELY(x) (x)</span>
|
|
<a name="l00028"></a>00028 <span class="preprocessor"></span><span class="preprocessor"> #endif</span>
|
|
<a name="l00029"></a>00029 <span class="preprocessor"></span>
|
|
<a name="l00030"></a>00030
|
|
<a name="l00034"></a><a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8">00034</a> <span class="keyword">typedef</span> uint32_t <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a>;
|
|
<a name="l00035"></a>00035
|
|
<a name="l00039"></a><a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb">00039</a> <span class="keyword">static</span> <span class="keyword">const</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb" title="Special constant that defines illegal code point.">illegal</a> = 0xFFFFFFFFu;
|
|
<a name="l00040"></a>00040
|
|
<a name="l00044"></a><a class="code" href="namespaceboost_1_1locale_1_1utf.html#a20dbe458fd18229a0e6c09888d031b38">00044</a> <span class="keyword">static</span> <span class="keyword">const</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a20dbe458fd18229a0e6c09888d031b38" title="Special constant that defines incomplete code point.">incomplete</a> = 0xFFFFFFFEu;
|
|
<a name="l00045"></a>00045
|
|
<a name="l00049"></a><a class="code" href="namespaceboost_1_1locale_1_1utf.html#a189805c4e9f4c033ce5f88daf780e08e">00049</a> <span class="keyword">inline</span> <span class="keywordtype">bool</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a189805c4e9f4c033ce5f88daf780e08e" title="the function checks if v is a valid code point">is_valid_codepoint</a>(<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> v)
|
|
<a name="l00050"></a>00050 {
|
|
<a name="l00051"></a>00051 <span class="keywordflow">if</span>(v>0x10FFFF)
|
|
<a name="l00052"></a>00052 <span class="keywordflow">return</span> <span class="keyword">false</span>;
|
|
<a name="l00053"></a>00053 <span class="keywordflow">if</span>(0xD800 <=v && v<= 0xDFFF) <span class="comment">// surrogates</span>
|
|
<a name="l00054"></a>00054 <span class="keywordflow">return</span> <span class="keyword">false</span>;
|
|
<a name="l00055"></a>00055 <span class="keywordflow">return</span> <span class="keyword">true</span>;
|
|
<a name="l00056"></a>00056 }
|
|
<a name="l00057"></a>00057
|
|
<a name="l00058"></a>00058 <span class="preprocessor"> #ifdef BOOST_LOCALE_DOXYGEN</span>
|
|
<a name="l00059"></a>00059 <span class="preprocessor"></span>
|
|
<a name="l00060"></a>00060
|
|
<a name="l00061"></a>00061
|
|
<a name="l00062"></a>00062 <span class="keyword">template</span><<span class="keyword">typename</span> CharType,<span class="keywordtype">int</span> size=sizeof(CharType)>
|
|
<a name="l00063"></a><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html">00063</a> <span class="keyword">struct </span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html" title="UTF Traits class - functions to convert UTF sequences to and from Unicode code points.">utf_traits</a> {
|
|
<a name="l00067"></a><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">00067</a> <span class="keyword">typedef</span> CharType <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a>;
|
|
<a name="l00082"></a>00082 <span class="keyword">template</span><<span class="keyword">typename</span> Iterator>
|
|
<a name="l00083"></a>00083 <span class="keyword">static</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a9b6b01fa6705ba67ac78359ddee03213">decode</a>(Iterator &p,Iterator e);
|
|
<a name="l00084"></a>00084
|
|
<a name="l00092"></a><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#abb4cb63a924d19505c2cb6e930c68a13">00092</a> <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#abb4cb63a924d19505c2cb6e930c68a13">max_width</a>;
|
|
<a name="l00099"></a>00099 <span class="keyword">static</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a26c106ec8816f48431f882017ab46763">width</a>(<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> value);
|
|
<a name="l00100"></a>00100
|
|
<a name="l00106"></a>00106 <span class="keyword">static</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a8a6b72ba87a817652f522018df51a9a7">trail_length</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> c);
|
|
<a name="l00110"></a>00110 <span class="keyword">static</span> <span class="keywordtype">bool</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#ae2cb78fcb8a58bed3e0ce1d6528a719a">is_trail</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> c);
|
|
<a name="l00114"></a>00114 <span class="keyword">static</span> <span class="keywordtype">bool</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a19789c4c26c8d9f576de5272f3d41a11">is_lead</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> c);
|
|
<a name="l00115"></a>00115
|
|
<a name="l00126"></a>00126 <span class="keyword">template</span><<span class="keyword">typename</span> Iterator>
|
|
<a name="l00127"></a>00127 <span class="keyword">static</span> Iterator <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#acd59f628af084f800f8a86cdd8124fd8">encode</a>(<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> value,Iterator out);
|
|
<a name="l00133"></a>00133 <span class="keyword">template</span><<span class="keyword">typename</span> Iterator>
|
|
<a name="l00134"></a>00134 <span class="keyword">static</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a8ff625b2c19b0d4132f7ec9e6303cb36">decode_valid</a>(Iterator &p);
|
|
<a name="l00135"></a>00135 };
|
|
<a name="l00136"></a>00136
|
|
<a name="l00137"></a>00137 <span class="preprocessor"> #else</span>
|
|
<a name="l00138"></a>00138 <span class="preprocessor"></span>
|
|
<a name="l00139"></a>00139 <span class="keyword">template</span><<span class="keyword">typename</span> CharType,<span class="keywordtype">int</span> size=sizeof(CharType)>
|
|
<a name="l00140"></a>00140 <span class="keyword">struct </span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html" title="UTF Traits class - functions to convert UTF sequences to and from Unicode code points.">utf_traits</a>;
|
|
<a name="l00141"></a>00141
|
|
<a name="l00142"></a>00142 <span class="keyword">template</span><<span class="keyword">typename</span> CharType>
|
|
<a name="l00143"></a>00143 <span class="keyword">struct </span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html" title="UTF Traits class - functions to convert UTF sequences to and from Unicode code points.">utf_traits</a><CharType,1> {
|
|
<a name="l00144"></a>00144
|
|
<a name="l00145"></a>00145 <span class="keyword">typedef</span> CharType <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a>;
|
|
<a name="l00146"></a>00146
|
|
<a name="l00147"></a>00147 <span class="keyword">static</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a8a6b72ba87a817652f522018df51a9a7">trail_length</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> ci)
|
|
<a name="l00148"></a>00148 {
|
|
<a name="l00149"></a>00149 <span class="keywordtype">unsigned</span> <span class="keywordtype">char</span> c = ci;
|
|
<a name="l00150"></a>00150 <span class="keywordflow">if</span>(c < 128)
|
|
<a name="l00151"></a>00151 <span class="keywordflow">return</span> 0;
|
|
<a name="l00152"></a>00152 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(c < 194))
|
|
<a name="l00153"></a>00153 <span class="keywordflow">return</span> -1;
|
|
<a name="l00154"></a>00154 <span class="keywordflow">if</span>(c < 224)
|
|
<a name="l00155"></a>00155 <span class="keywordflow">return</span> 1;
|
|
<a name="l00156"></a>00156 <span class="keywordflow">if</span>(c < 240)
|
|
<a name="l00157"></a>00157 <span class="keywordflow">return</span> 2;
|
|
<a name="l00158"></a>00158 <span class="keywordflow">if</span>(BOOST_LOCALE_LIKELY(c <=244))
|
|
<a name="l00159"></a>00159 <span class="keywordflow">return</span> 3;
|
|
<a name="l00160"></a>00160 <span class="keywordflow">return</span> -1;
|
|
<a name="l00161"></a>00161 }
|
|
<a name="l00162"></a>00162
|
|
<a name="l00163"></a>00163 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#abb4cb63a924d19505c2cb6e930c68a13">max_width</a> = 4;
|
|
<a name="l00164"></a>00164
|
|
<a name="l00165"></a>00165 <span class="keyword">static</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a26c106ec8816f48431f882017ab46763">width</a>(<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> value)
|
|
<a name="l00166"></a>00166 {
|
|
<a name="l00167"></a>00167 <span class="keywordflow">if</span>(value <=0x7F) {
|
|
<a name="l00168"></a>00168 <span class="keywordflow">return</span> 1;
|
|
<a name="l00169"></a>00169 }
|
|
<a name="l00170"></a>00170 <span class="keywordflow">else</span> <span class="keywordflow">if</span>(value <=0x7FF) {
|
|
<a name="l00171"></a>00171 <span class="keywordflow">return</span> 2;
|
|
<a name="l00172"></a>00172 }
|
|
<a name="l00173"></a>00173 <span class="keywordflow">else</span> <span class="keywordflow">if</span>(BOOST_LOCALE_LIKELY(value <=0xFFFF)) {
|
|
<a name="l00174"></a>00174 <span class="keywordflow">return</span> 3;
|
|
<a name="l00175"></a>00175 }
|
|
<a name="l00176"></a>00176 <span class="keywordflow">else</span> {
|
|
<a name="l00177"></a>00177 <span class="keywordflow">return</span> 4;
|
|
<a name="l00178"></a>00178 }
|
|
<a name="l00179"></a>00179 }
|
|
<a name="l00180"></a>00180
|
|
<a name="l00181"></a>00181 <span class="keyword">static</span> <span class="keywordtype">bool</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#ae2cb78fcb8a58bed3e0ce1d6528a719a">is_trail</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> ci)
|
|
<a name="l00182"></a>00182 {
|
|
<a name="l00183"></a>00183 <span class="keywordtype">unsigned</span> <span class="keywordtype">char</span> c=ci;
|
|
<a name="l00184"></a>00184 <span class="keywordflow">return</span> (c & 0xC0)==0x80;
|
|
<a name="l00185"></a>00185 }
|
|
<a name="l00186"></a>00186
|
|
<a name="l00187"></a>00187 <span class="keyword">static</span> <span class="keywordtype">bool</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a19789c4c26c8d9f576de5272f3d41a11">is_lead</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> ci)
|
|
<a name="l00188"></a>00188 {
|
|
<a name="l00189"></a>00189 <span class="keywordflow">return</span> !<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#ae2cb78fcb8a58bed3e0ce1d6528a719a">is_trail</a>(ci);
|
|
<a name="l00190"></a>00190 }
|
|
<a name="l00191"></a>00191
|
|
<a name="l00192"></a>00192 <span class="keyword">template</span><<span class="keyword">typename</span> Iterator>
|
|
<a name="l00193"></a>00193 <span class="keyword">static</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a9b6b01fa6705ba67ac78359ddee03213">decode</a>(Iterator &p,Iterator e)
|
|
<a name="l00194"></a>00194 {
|
|
<a name="l00195"></a>00195 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(p==e))
|
|
<a name="l00196"></a>00196 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a20dbe458fd18229a0e6c09888d031b38" title="Special constant that defines incomplete code point.">incomplete</a>;
|
|
<a name="l00197"></a>00197
|
|
<a name="l00198"></a>00198 <span class="keywordtype">unsigned</span> <span class="keywordtype">char</span> lead = *p++;
|
|
<a name="l00199"></a>00199
|
|
<a name="l00200"></a>00200 <span class="comment">// First byte is fully validated here</span>
|
|
<a name="l00201"></a>00201 <span class="keywordtype">int</span> trail_size = <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a8a6b72ba87a817652f522018df51a9a7">trail_length</a>(lead);
|
|
<a name="l00202"></a>00202
|
|
<a name="l00203"></a>00203 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(trail_size < 0))
|
|
<a name="l00204"></a>00204 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb" title="Special constant that defines illegal code point.">illegal</a>;
|
|
<a name="l00205"></a>00205
|
|
<a name="l00206"></a>00206 <span class="comment">//</span>
|
|
<a name="l00207"></a>00207 <span class="comment">// Ok as only ASCII may be of size = 0</span>
|
|
<a name="l00208"></a>00208 <span class="comment">// also optimize for ASCII text</span>
|
|
<a name="l00209"></a>00209 <span class="comment">//</span>
|
|
<a name="l00210"></a>00210 <span class="keywordflow">if</span>(trail_size == 0)
|
|
<a name="l00211"></a>00211 <span class="keywordflow">return</span> lead;
|
|
<a name="l00212"></a>00212
|
|
<a name="l00213"></a>00213 <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> c = lead & ((1<<(6-trail_size))-1);
|
|
<a name="l00214"></a>00214
|
|
<a name="l00215"></a>00215 <span class="comment">// Read the rest</span>
|
|
<a name="l00216"></a>00216 <span class="keywordtype">unsigned</span> <span class="keywordtype">char</span> tmp;
|
|
<a name="l00217"></a>00217 <span class="keywordflow">switch</span>(trail_size) {
|
|
<a name="l00218"></a>00218 <span class="keywordflow">case</span> 3:
|
|
<a name="l00219"></a>00219 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(p==e))
|
|
<a name="l00220"></a>00220 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a20dbe458fd18229a0e6c09888d031b38" title="Special constant that defines incomplete code point.">incomplete</a>;
|
|
<a name="l00221"></a>00221 tmp = *p++;
|
|
<a name="l00222"></a>00222 <span class="keywordflow">if</span> (!<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#ae2cb78fcb8a58bed3e0ce1d6528a719a">is_trail</a>(tmp))
|
|
<a name="l00223"></a>00223 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb" title="Special constant that defines illegal code point.">illegal</a>;
|
|
<a name="l00224"></a>00224 c = (c << 6) | ( tmp & 0x3F);
|
|
<a name="l00225"></a>00225 <span class="keywordflow">case</span> 2:
|
|
<a name="l00226"></a>00226 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(p==e))
|
|
<a name="l00227"></a>00227 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a20dbe458fd18229a0e6c09888d031b38" title="Special constant that defines incomplete code point.">incomplete</a>;
|
|
<a name="l00228"></a>00228 tmp = *p++;
|
|
<a name="l00229"></a>00229 <span class="keywordflow">if</span> (!<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#ae2cb78fcb8a58bed3e0ce1d6528a719a">is_trail</a>(tmp))
|
|
<a name="l00230"></a>00230 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb" title="Special constant that defines illegal code point.">illegal</a>;
|
|
<a name="l00231"></a>00231 c = (c << 6) | ( tmp & 0x3F);
|
|
<a name="l00232"></a>00232 <span class="keywordflow">case</span> 1:
|
|
<a name="l00233"></a>00233 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(p==e))
|
|
<a name="l00234"></a>00234 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a20dbe458fd18229a0e6c09888d031b38" title="Special constant that defines incomplete code point.">incomplete</a>;
|
|
<a name="l00235"></a>00235 tmp = *p++;
|
|
<a name="l00236"></a>00236 <span class="keywordflow">if</span> (!<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#ae2cb78fcb8a58bed3e0ce1d6528a719a">is_trail</a>(tmp))
|
|
<a name="l00237"></a>00237 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb" title="Special constant that defines illegal code point.">illegal</a>;
|
|
<a name="l00238"></a>00238 c = (c << 6) | ( tmp & 0x3F);
|
|
<a name="l00239"></a>00239 }
|
|
<a name="l00240"></a>00240
|
|
<a name="l00241"></a>00241 <span class="comment">// Check code point validity: no surrogates and</span>
|
|
<a name="l00242"></a>00242 <span class="comment">// valid range</span>
|
|
<a name="l00243"></a>00243 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(!<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a189805c4e9f4c033ce5f88daf780e08e" title="the function checks if v is a valid code point">is_valid_codepoint</a>(c)))
|
|
<a name="l00244"></a>00244 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb" title="Special constant that defines illegal code point.">illegal</a>;
|
|
<a name="l00245"></a>00245
|
|
<a name="l00246"></a>00246 <span class="comment">// make sure it is the most compact representation</span>
|
|
<a name="l00247"></a>00247 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a26c106ec8816f48431f882017ab46763">width</a>(c)!=trail_size + 1))
|
|
<a name="l00248"></a>00248 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb" title="Special constant that defines illegal code point.">illegal</a>;
|
|
<a name="l00249"></a>00249
|
|
<a name="l00250"></a>00250 <span class="keywordflow">return</span> c;
|
|
<a name="l00251"></a>00251
|
|
<a name="l00252"></a>00252 }
|
|
<a name="l00253"></a>00253
|
|
<a name="l00254"></a>00254 <span class="keyword">template</span><<span class="keyword">typename</span> Iterator>
|
|
<a name="l00255"></a>00255 <span class="keyword">static</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a8ff625b2c19b0d4132f7ec9e6303cb36">decode_valid</a>(Iterator &p)
|
|
<a name="l00256"></a>00256 {
|
|
<a name="l00257"></a>00257 <span class="keywordtype">unsigned</span> <span class="keywordtype">char</span> lead = *p++;
|
|
<a name="l00258"></a>00258 <span class="keywordflow">if</span>(lead < 192)
|
|
<a name="l00259"></a>00259 <span class="keywordflow">return</span> lead;
|
|
<a name="l00260"></a>00260
|
|
<a name="l00261"></a>00261 <span class="keywordtype">int</span> trail_size;
|
|
<a name="l00262"></a>00262
|
|
<a name="l00263"></a>00263 <span class="keywordflow">if</span>(lead < 224)
|
|
<a name="l00264"></a>00264 trail_size = 1;
|
|
<a name="l00265"></a>00265 <span class="keywordflow">else</span> <span class="keywordflow">if</span>(BOOST_LOCALE_LIKELY(lead < 240)) <span class="comment">// non-BMP rare</span>
|
|
<a name="l00266"></a>00266 trail_size = 2;
|
|
<a name="l00267"></a>00267 <span class="keywordflow">else</span>
|
|
<a name="l00268"></a>00268 trail_size = 3;
|
|
<a name="l00269"></a>00269
|
|
<a name="l00270"></a>00270 <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> c = lead & ((1<<(6-trail_size))-1);
|
|
<a name="l00271"></a>00271
|
|
<a name="l00272"></a>00272 <span class="keywordflow">switch</span>(trail_size) {
|
|
<a name="l00273"></a>00273 <span class="keywordflow">case</span> 3:
|
|
<a name="l00274"></a>00274 c = (c << 6) | ( static_cast<unsigned char>(*p++) & 0x3F);
|
|
<a name="l00275"></a>00275 <span class="keywordflow">case</span> 2:
|
|
<a name="l00276"></a>00276 c = (c << 6) | ( static_cast<unsigned char>(*p++) & 0x3F);
|
|
<a name="l00277"></a>00277 <span class="keywordflow">case</span> 1:
|
|
<a name="l00278"></a>00278 c = (c << 6) | ( static_cast<unsigned char>(*p++) & 0x3F);
|
|
<a name="l00279"></a>00279 }
|
|
<a name="l00280"></a>00280
|
|
<a name="l00281"></a>00281 <span class="keywordflow">return</span> c;
|
|
<a name="l00282"></a>00282 }
|
|
<a name="l00283"></a>00283
|
|
<a name="l00284"></a>00284
|
|
<a name="l00285"></a>00285
|
|
<a name="l00286"></a>00286 <span class="keyword">template</span><<span class="keyword">typename</span> Iterator>
|
|
<a name="l00287"></a>00287 <span class="keyword">static</span> Iterator <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#acd59f628af084f800f8a86cdd8124fd8">encode</a>(<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> value,Iterator out)
|
|
<a name="l00288"></a>00288 {
|
|
<a name="l00289"></a>00289 <span class="keywordflow">if</span>(value <= 0x7F) {
|
|
<a name="l00290"></a>00290 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>(value);
|
|
<a name="l00291"></a>00291 }
|
|
<a name="l00292"></a>00292 <span class="keywordflow">else</span> <span class="keywordflow">if</span>(value <= 0x7FF) {
|
|
<a name="l00293"></a>00293 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>((value >> 6) | 0xC0);
|
|
<a name="l00294"></a>00294 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>((value & 0x3F) | 0x80);
|
|
<a name="l00295"></a>00295 }
|
|
<a name="l00296"></a>00296 <span class="keywordflow">else</span> <span class="keywordflow">if</span>(BOOST_LOCALE_LIKELY(value <= 0xFFFF)) {
|
|
<a name="l00297"></a>00297 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>((value >> 12) | 0xE0);
|
|
<a name="l00298"></a>00298 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>(((value >> 6) & 0x3F) | 0x80);
|
|
<a name="l00299"></a>00299 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>((value & 0x3F) | 0x80);
|
|
<a name="l00300"></a>00300 }
|
|
<a name="l00301"></a>00301 <span class="keywordflow">else</span> {
|
|
<a name="l00302"></a>00302 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>((value >> 18) | 0xF0);
|
|
<a name="l00303"></a>00303 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>(((value >> 12) & 0x3F) | 0x80);
|
|
<a name="l00304"></a>00304 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>(((value >> 6) & 0x3F) | 0x80);
|
|
<a name="l00305"></a>00305 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>((value & 0x3F) | 0x80);
|
|
<a name="l00306"></a>00306 }
|
|
<a name="l00307"></a>00307 <span class="keywordflow">return</span> out;
|
|
<a name="l00308"></a>00308 }
|
|
<a name="l00309"></a>00309 }; <span class="comment">// utf8</span>
|
|
<a name="l00310"></a>00310
|
|
<a name="l00311"></a>00311 <span class="keyword">template</span><<span class="keyword">typename</span> CharType>
|
|
<a name="l00312"></a>00312 <span class="keyword">struct </span>utf_traits<CharType,2> {
|
|
<a name="l00313"></a>00313 <span class="keyword">typedef</span> CharType <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a>;
|
|
<a name="l00314"></a>00314
|
|
<a name="l00315"></a>00315 <span class="comment">// See RFC 2781</span>
|
|
<a name="l00316"></a>00316 <span class="keyword">static</span> <span class="keywordtype">bool</span> is_first_surrogate(uint16_t x)
|
|
<a name="l00317"></a>00317 {
|
|
<a name="l00318"></a>00318 <span class="keywordflow">return</span> 0xD800 <=x && x<= 0xDBFF;
|
|
<a name="l00319"></a>00319 }
|
|
<a name="l00320"></a>00320 <span class="keyword">static</span> <span class="keywordtype">bool</span> is_second_surrogate(uint16_t x)
|
|
<a name="l00321"></a>00321 {
|
|
<a name="l00322"></a>00322 <span class="keywordflow">return</span> 0xDC00 <=x && x<= 0xDFFF;
|
|
<a name="l00323"></a>00323 }
|
|
<a name="l00324"></a>00324 <span class="keyword">static</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> combine_surrogate(uint16_t w1,uint16_t w2)
|
|
<a name="l00325"></a>00325 {
|
|
<a name="l00326"></a>00326 <span class="keywordflow">return</span> ((<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a>(w1 & 0x3FF) << 10) | (w2 & 0x3FF)) + 0x10000;
|
|
<a name="l00327"></a>00327 }
|
|
<a name="l00328"></a>00328 <span class="keyword">static</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a8a6b72ba87a817652f522018df51a9a7">trail_length</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> c)
|
|
<a name="l00329"></a>00329 {
|
|
<a name="l00330"></a>00330 <span class="keywordflow">if</span>(is_first_surrogate(c))
|
|
<a name="l00331"></a>00331 <span class="keywordflow">return</span> 1;
|
|
<a name="l00332"></a>00332 <span class="keywordflow">if</span>(is_second_surrogate(c))
|
|
<a name="l00333"></a>00333 <span class="keywordflow">return</span> -1;
|
|
<a name="l00334"></a>00334 <span class="keywordflow">return</span> 0;
|
|
<a name="l00335"></a>00335 }
|
|
<a name="l00339"></a>00339 <span class="keyword">static</span> <span class="keywordtype">bool</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#ae2cb78fcb8a58bed3e0ce1d6528a719a">is_trail</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> c)
|
|
<a name="l00340"></a>00340 {
|
|
<a name="l00341"></a>00341 <span class="keywordflow">return</span> is_second_surrogate(c);
|
|
<a name="l00342"></a>00342 }
|
|
<a name="l00346"></a>00346 <span class="keyword">static</span> <span class="keywordtype">bool</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a19789c4c26c8d9f576de5272f3d41a11">is_lead</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> c)
|
|
<a name="l00347"></a>00347 {
|
|
<a name="l00348"></a>00348 <span class="keywordflow">return</span> !is_second_surrogate(c);
|
|
<a name="l00349"></a>00349 }
|
|
<a name="l00350"></a>00350
|
|
<a name="l00351"></a>00351 <span class="keyword">template</span><<span class="keyword">typename</span> It>
|
|
<a name="l00352"></a>00352 <span class="keyword">static</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a9b6b01fa6705ba67ac78359ddee03213">decode</a>(It &amp;current,It last)
|
|
<a name="l00353"></a>00353 {
|
|
<a name="l00354"></a>00354 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(current == last))
|
|
<a name="l00355"></a>00355 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a20dbe458fd18229a0e6c09888d031b38" title="Special constant that defines incomplete code point.">incomplete</a>;
|
|
<a name="l00356"></a>00356 uint16_t w1=*current++;
|
|
<a name="l00357"></a>00357 <span class="keywordflow">if</span>(BOOST_LOCALE_LIKELY(w1 < 0xD800 || 0xDFFF < w1)) {
|
|
<a name="l00358"></a>00358 <span class="keywordflow">return</span> w1;
|
|
<a name="l00359"></a>00359 }
|
|
<a name="l00360"></a>00360 <span class="keywordflow">if</span>(w1 > 0xDBFF)
|
|
<a name="l00361"></a>00361 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb" title="Special constant that defines illegal code point.">illegal</a>;
|
|
<a name="l00362"></a>00362 <span class="keywordflow">if</span>(current==last)
|
|
<a name="l00363"></a>00363 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a20dbe458fd18229a0e6c09888d031b38" title="Special constant that defines incomplete code point.">incomplete</a>;
|
|
<a name="l00364"></a>00364 uint16_t w2=*current++;
|
|
<a name="l00365"></a>00365 <span class="keywordflow">if</span>(w2 < 0xDC00 || 0xDFFF < w2)
|
|
<a name="l00366"></a>00366 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb" title="Special constant that defines illegal code point.">illegal</a>;
|
|
<a name="l00367"></a>00367 <span class="keywordflow">return</span> combine_surrogate(w1,w2);
|
|
<a name="l00368"></a>00368 }
|
|
<a name="l00369"></a>00369 <span class="keyword">template</span><<span class="keyword">typename</span> It>
|
|
<a name="l00370"></a>00370 <span class="keyword">static</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a8ff625b2c19b0d4132f7ec9e6303cb36">decode_valid</a>(It &amp;current)
|
|
<a name="l00371"></a>00371 {
|
|
<a name="l00372"></a>00372 uint16_t w1=*current++;
|
|
<a name="l00373"></a>00373 <span class="keywordflow">if</span>(BOOST_LOCALE_LIKELY(w1 < 0xD800 || 0xDFFF < w1)) {
|
|
<a name="l00374"></a>00374 <span class="keywordflow">return</span> w1;
|
|
<a name="l00375"></a>00375 }
|
|
<a name="l00376"></a>00376 uint16_t w2=*current++;
|
|
<a name="l00377"></a>00377 <span class="keywordflow">return</span> combine_surrogate(w1,w2);
|
|
<a name="l00378"></a>00378 }
|
|
<a name="l00379"></a>00379
|
|
<a name="l00380"></a>00380 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#abb4cb63a924d19505c2cb6e930c68a13">max_width</a> = 2;
|
|
<a name="l00381"></a>00381 <span class="keyword">static</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a26c106ec8816f48431f882017ab46763">width</a>(<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> u)
|
|
<a name="l00382"></a>00382 {
|
|
<a name="l00383"></a>00383 <span class="keywordflow">return</span> u>=0x10000 ? 2 : 1;
|
|
<a name="l00384"></a>00384 }
|
|
<a name="l00385"></a>00385 <span class="keyword">template</span><<span class="keyword">typename</span> It>
|
|
<a name="l00386"></a>00386 <span class="keyword">static</span> It <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#acd59f628af084f800f8a86cdd8124fd8">encode</a>(<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> u,It out)
|
|
<a name="l00387"></a>00387 {
|
|
<a name="l00388"></a>00388 <span class="keywordflow">if</span>(BOOST_LOCALE_LIKELY(u<=0xFFFF)) {
|
|
<a name="l00389"></a>00389 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>(u);
|
|
<a name="l00390"></a>00390 }
|
|
<a name="l00391"></a>00391 <span class="keywordflow">else</span> {
|
|
<a name="l00392"></a>00392 u -= 0x10000;
|
|
<a name="l00393"></a>00393 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>(0xD800 | (u>>10));
|
|
<a name="l00394"></a>00394 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>(0xDC00 | (u & 0x3FF));
|
|
<a name="l00395"></a>00395 }
|
|
<a name="l00396"></a>00396 <span class="keywordflow">return</span> out;
|
|
<a name="l00397"></a>00397 }
|
|
<a name="l00398"></a>00398 }; <span class="comment">// utf16;</span>
|
|
<a name="l00399"></a>00399
|
|
<a name="l00400"></a>00400
|
|
<a name="l00401"></a>00401 <span class="keyword">template</span><<span class="keyword">typename</span> CharType>
|
|
<a name="l00402"></a>00402 <span class="keyword">struct </span>utf_traits&lt;CharType,4&gt; {
|
|
<a name="l00403"></a>00403 <span class="keyword">typedef</span> CharType <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a>;
|
|
<a name="l00404"></a>00404 <span class="keyword">static</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a8a6b72ba87a817652f522018df51a9a7">trail_length</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> c)
|
|
<a name="l00405"></a>00405 {
|
|
<a name="l00406"></a>00406 <span class="keywordflow">if</span>(<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a189805c4e9f4c033ce5f88daf780e08e" title="the function checks if v is a valid code point">is_valid_codepoint</a>(c))
|
|
<a name="l00407"></a>00407 <span class="keywordflow">return</span> 0;
|
|
<a name="l00408"></a>00408 <span class="keywordflow">return</span> -1;
|
|
<a name="l00409"></a>00409 }
|
|
<a name="l00410"></a>00410 <span class="keyword">static</span> <span class="keywordtype">bool</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#ae2cb78fcb8a58bed3e0ce1d6528a719a">is_trail</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> <span class="comment">/*c*/</span>)
|
|
<a name="l00411"></a>00411 {
|
|
<a name="l00412"></a>00412 <span class="keywordflow">return</span> <span class="keyword">false</span>;
|
|
<a name="l00413"></a>00413 }
|
|
<a name="l00414"></a>00414 <span class="keyword">static</span> <span class="keywordtype">bool</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a19789c4c26c8d9f576de5272f3d41a11">is_lead</a>(<a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a> <span class="comment">/*c*/</span>)
|
|
<a name="l00415"></a>00415 {
|
|
<a name="l00416"></a>00416 <span class="keywordflow">return</span> <span class="keyword">true</span>;
|
|
<a name="l00417"></a>00417 }
|
|
<a name="l00418"></a>00418
|
|
<a name="l00419"></a>00419 <span class="keyword">template</span><<span class="keyword">typename</span> It>
|
|
<a name="l00420"></a>00420 <span class="keyword">static</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a8ff625b2c19b0d4132f7ec9e6303cb36">decode_valid</a>(It &amp;current)
|
|
<a name="l00421"></a>00421 {
|
|
<a name="l00422"></a>00422 <span class="keywordflow">return</span> *current++;
|
|
<a name="l00423"></a>00423 }
|
|
<a name="l00424"></a>00424
|
|
<a name="l00425"></a>00425 <span class="keyword">template</span><<span class="keyword">typename</span> It>
|
|
<a name="l00426"></a>00426 <span class="keyword">static</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a9b6b01fa6705ba67ac78359ddee03213">decode</a>(It &amp;current,It last)
|
|
<a name="l00427"></a>00427 {
|
|
<a name="l00428"></a>00428 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(current == last))
|
|
<a name="l00429"></a>00429 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a20dbe458fd18229a0e6c09888d031b38" title="Special constant that defines incomplete code point.">boost::locale::utf::incomplete</a>;
|
|
<a name="l00430"></a>00430 <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> c=*current++;
|
|
<a name="l00431"></a>00431 <span class="keywordflow">if</span>(BOOST_LOCALE_UNLIKELY(!<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a189805c4e9f4c033ce5f88daf780e08e" title="the function checks if v is a valid code point">is_valid_codepoint</a>(c)))
|
|
<a name="l00432"></a>00432 <span class="keywordflow">return</span> <a class="code" href="namespaceboost_1_1locale_1_1utf.html#a30010000878c7732340bda8956b844fb" title="Special constant that defines illegal code point.">boost::locale::utf::illegal</a>;
|
|
<a name="l00433"></a>00433 <span class="keywordflow">return</span> c;
|
|
<a name="l00434"></a>00434 }
|
|
<a name="l00435"></a>00435 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#abb4cb63a924d19505c2cb6e930c68a13">max_width</a> = 1;
|
|
<a name="l00436"></a>00436 <span class="keyword">static</span> <span class="keywordtype">int</span> <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#a26c106ec8816f48431f882017ab46763">width</a>(<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> <span class="comment">/*u*/</span>)
|
|
<a name="l00437"></a>00437 {
|
|
<a name="l00438"></a>00438 <span class="keywordflow">return</span> 1;
|
|
<a name="l00439"></a>00439 }
|
|
<a name="l00440"></a>00440 <span class="keyword">template</span><<span class="keyword">typename</span> It>
|
|
<a name="l00441"></a>00441 <span class="keyword">static</span> It <a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#acd59f628af084f800f8a86cdd8124fd8">encode</a>(<a class="code" href="namespaceboost_1_1locale_1_1utf.html#a068111a6b9d6d465a63893ed5c05e2f8" title="The integral type that can hold a Unicode code point.">code_point</a> u,It out)
|
|
<a name="l00442"></a>00442 {
|
|
<a name="l00443"></a>00443 *out++ = <span class="keyword">static_cast<</span><a class="code" href="structboost_1_1locale_1_1utf_1_1utf__traits.html#accca9dc2d8fe018b9b5640c48e3470e4">char_type</a><span class="keyword">></span>(u);
|
|
<a name="l00444"></a>00444 <span class="keywordflow">return</span> out;
|
|
<a name="l00445"></a>00445 }
|
|
<a name="l00446"></a>00446
|
|
<a name="l00447"></a>00447 }; <span class="comment">// utf32</span>
|
|
<a name="l00448"></a>00448
|
|
<a name="l00449"></a>00449 <span class="preprocessor"> #endif</span>
|
|
<a name="l00450"></a>00450 <span class="preprocessor"></span>
|
|
<a name="l00451"></a>00451
|
|
<a name="l00452"></a>00452 } <span class="comment">// utf</span>
|
|
<a name="l00453"></a>00453 } <span class="comment">// locale</span>
|
|
<a name="l00454"></a>00454 } <span class="comment">// boost</span>
|
|
<a name="l00455"></a>00455
|
|
<a name="l00456"></a>00456
|
|
<a name="l00457"></a>00457 <span class="preprocessor">#endif</span>
|
|
<a name="l00458"></a>00458 <span class="preprocessor"></span>
|
|
<a name="l00459"></a>00459 <span class="comment">// vim: tabstop=4 expandtab shiftwidth=4 softtabstop=4</span>
|
|
<a name="l00460"></a>00460
|
|
</pre></div></div><!-- contents -->
|
|
</div>
|
|
<div id="nav-path" class="navpath">
|
|
<ul>
|
|
<li class="navelem"><b>utf.hpp</b> </li>
|
|
|
|
<li class="footer">
|
|
© Copyright 2009-2012 Artyom Beilis, Distributed under the <a href="http://www.boost.org/LICENSE_1_0.txt">Boost Software License</a>, Version 1.0.
|
|
</li>
|
|
</ul>
|
|
</div>
|
|
|
|
|
|
</body>
|
|
</html>
|