UNPKG

boost-react-native-bundle

Version:

Boost library as in https://sourceforge.net/projects/boost/files/boost/1.57.0/

610 lines (596 loc) 87.6 kB
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"> <html xmlns="http://www.w3.org/1999/xhtml"> <head> <meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/> <meta http-equiv="X-UA-Compatible" content="IE=9"/> <title>Boost.Locale: boost/locale/boundary/index.hpp Source File</title> <link href="tabs.css" rel="stylesheet" type="text/css"/> <link href="doxygen.css" rel="stylesheet" type="text/css" /> <link href="navtree.css" rel="stylesheet" type="text/css"/> <script type="text/javascript" src="jquery.js"></script> <script type="text/javascript" src="resize.js"></script> <script type="text/javascript" src="navtree.js"></script> <script type="text/javascript"> $(document).ready(initResizable); </script> </head> <body> <div id="top"><!-- do not remove this div! --> <div id="titlearea"> <table cellspacing="0" cellpadding="0"> <tbody> <tr style="height: 56px;"> <td id="projectlogo"><img alt="Logo" src="boost-small.png"/></td> <td style="padding-left: 0.5em;"> <div id="projectname">Boost.Locale </div> </td> </tr> </tbody> </table> </div> <!-- Generated by Doxygen 1.7.6.1 --> <div id="navrow1" class="tabs"> <ul class="tablist"> <li><a href="index.html"><span>Main&#160;Page</span></a></li> <li><a href="modules.html"><span>Modules</span></a></li> <li><a href="namespaces.html"><span>Namespaces</span></a></li> <li><a href="annotated.html"><span>Classes</span></a></li> <li class="current"><a href="files.html"><span>Files</span></a></li> <li><a href="examples.html"><span>Examples</span></a></li> </ul> </div> <div id="navrow2" class="tabs2"> <ul class="tablist"> <li><a href="files.html"><span>File&#160;List</span></a></li> </ul> </div> </div> <div id="side-nav" class="ui-resizable side-nav-resizable"> <div id="nav-tree"> <div id="nav-tree-contents"> </div> </div> <div id="splitbar" style="-moz-user-select:none;" class="ui-resizable-handle"> </div> </div> <script type="text/javascript"> 
initNavTree('index_8hpp.html',''); </script> <div id="doc-content"> <div class="header"> <div class="headertitle"> <div class="title">boost/locale/boundary/index.hpp</div> </div> </div><!--header--> <div class="contents"> <div class="fragment"><pre class="fragment"><a name="l00001"></a>00001 <span class="comment">//</span> <a name="l00002"></a>00002 <span class="comment">// Copyright (c) 2009-2011 Artyom Beilis (Tonkikh)</span> <a name="l00003"></a>00003 <span class="comment">//</span> <a name="l00004"></a>00004 <span class="comment">// Distributed under the Boost Software License, Version 1.0. (See</span> <a name="l00005"></a>00005 <span class="comment">// accompanying file LICENSE_1_0.txt or copy at</span> <a name="l00006"></a>00006 <span class="comment">// http://www.boost.org/LICENSE_1_0.txt)</span> <a name="l00007"></a>00007 <span class="comment">//</span> <a name="l00008"></a>00008 <span class="preprocessor">#ifndef BOOST_LOCALE_BOUNDARY_INDEX_HPP_INCLUDED</span> <a name="l00009"></a>00009 <span class="preprocessor"></span><span class="preprocessor">#define BOOST_LOCALE_BOUNDARY_INDEX_HPP_INCLUDED</span> <a name="l00010"></a>00010 <span class="preprocessor"></span> <a name="l00011"></a>00011 <span class="preprocessor">#include &lt;boost/locale/config.hpp&gt;</span> <a name="l00012"></a>00012 <span class="preprocessor">#include &lt;boost/locale/boundary/types.hpp&gt;</span> <a name="l00013"></a>00013 <span class="preprocessor">#include &lt;boost/locale/boundary/facets.hpp&gt;</span> <a name="l00014"></a>00014 <span class="preprocessor">#include &lt;boost/locale/boundary/segment.hpp&gt;</span> <a name="l00015"></a>00015 <span class="preprocessor">#include &lt;boost/locale/boundary/boundary_point.hpp&gt;</span> <a name="l00016"></a>00016 <span class="preprocessor">#include &lt;boost/iterator/iterator_facade.hpp&gt;</span> <a name="l00017"></a>00017 <span class="preprocessor">#include &lt;boost/type_traits/is_same.hpp&gt;</span> <a name="l00018"></a>00018 <span 
class="preprocessor">#include &lt;boost/shared_ptr.hpp&gt;</span> <a name="l00019"></a>00019 <span class="preprocessor">#include &lt;boost/cstdint.hpp&gt;</span> <a name="l00020"></a>00020 <span class="preprocessor">#include &lt;boost/assert.hpp&gt;</span> <a name="l00021"></a>00021 <span class="preprocessor">#ifdef BOOST_MSVC</span> <a name="l00022"></a>00022 <span class="preprocessor"></span><span class="preprocessor"># pragma warning(push)</span> <a name="l00023"></a>00023 <span class="preprocessor"></span><span class="preprocessor"># pragma warning(disable : 4275 4251 4231 4660)</span> <a name="l00024"></a>00024 <span class="preprocessor"></span><span class="preprocessor">#endif</span> <a name="l00025"></a>00025 <span class="preprocessor"></span><span class="preprocessor">#include &lt;string&gt;</span> <a name="l00026"></a>00026 <span class="preprocessor">#include &lt;locale&gt;</span> <a name="l00027"></a>00027 <span class="preprocessor">#include &lt;vector&gt;</span> <a name="l00028"></a>00028 <span class="preprocessor">#include &lt;iterator&gt;</span> <a name="l00029"></a>00029 <span class="preprocessor">#include &lt;algorithm&gt;</span> <a name="l00030"></a>00030 <span class="preprocessor">#include &lt;stdexcept&gt;</span> <a name="l00031"></a>00031 <a name="l00032"></a>00032 <span class="preprocessor">#include &lt;iostream&gt;</span> <a name="l00033"></a>00033 <a name="l00034"></a>00034 <span class="keyword">namespace </span>boost { <a name="l00035"></a>00035 <a name="l00036"></a>00036 <span class="keyword">namespace </span>locale { <a name="l00037"></a>00037 <a name="l00038"></a>00038 <span class="keyword">namespace </span>boundary { <a name="l00046"></a>00046 <a name="l00048"></a>00048 <a name="l00049"></a>00049 <span class="keyword">namespace </span>details { <a name="l00050"></a>00050 <a name="l00051"></a>00051 template&lt;typename IteratorType,typename CategoryType = typename std::iterator_traits&lt;IteratorType&gt;::iterator_category&gt; <a 
name="l00052"></a>00052 <span class="keyword">struct </span>mapping_traits { <a name="l00053"></a>00053 <span class="keyword">typedef</span> <span class="keyword">typename</span> std::iterator_traits&lt;IteratorType&gt;::value_type char_type; <a name="l00054"></a>00054 <span class="keyword">static</span> <a class="code" href="group__boundary.html#ga7b4dd7af8fad53fabd77e629da24d466">index_type</a> map(<a class="code" href="group__boundary.html#ga15de9963ce9bb6037c8525901dfbf641">boundary_type</a> t,IteratorType b,IteratorType e,std::locale <span class="keyword">const</span> &amp;l) <a name="l00055"></a>00055 { <a name="l00056"></a>00056 std::basic_string&lt;char_type&gt; str(b,e); <a name="l00057"></a>00057 <span class="keywordflow">return</span> std::use_facet&lt;boundary_indexing&lt;char_type&gt; &gt;(l).map(t,str.c_str(),str.c_str()+str.size()); <a name="l00058"></a>00058 } <a name="l00059"></a>00059 }; <a name="l00060"></a>00060 <a name="l00061"></a>00061 <span class="keyword">template</span>&lt;<span class="keyword">typename</span> CharType,<span class="keyword">typename</span> SomeIteratorType&gt; <a name="l00062"></a>00062 <span class="keyword">struct </span>linear_iterator_traits { <a name="l00063"></a>00063 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">bool</span> is_linear = <a name="l00064"></a>00064 is_same&lt;SomeIteratorType,CharType*&gt;::value <a name="l00065"></a>00065 || is_same&lt;SomeIteratorType,CharType const*&gt;::value <a name="l00066"></a>00066 || is_same&lt;SomeIteratorType,typename std::basic_string&lt;CharType&gt;::iterator&gt;::value <a name="l00067"></a>00067 || is_same&lt;SomeIteratorType,typename std::basic_string&lt;CharType&gt;::const_iterator&gt;::value <a name="l00068"></a>00068 || is_same&lt;SomeIteratorType,typename std::vector&lt;CharType&gt;::iterator&gt;::value <a name="l00069"></a>00069 || is_same&lt;SomeIteratorType,typename 
std::vector&lt;CharType&gt;::const_iterator&gt;::value <a name="l00070"></a>00070 ; <a name="l00071"></a>00071 }; <a name="l00072"></a>00072 <a name="l00073"></a>00073 <a name="l00074"></a>00074 <a name="l00075"></a>00075 <span class="keyword">template</span>&lt;<span class="keyword">typename</span> IteratorType&gt; <a name="l00076"></a>00076 <span class="keyword">struct </span>mapping_traits&lt;IteratorType,std::random_access_iterator_tag&gt; { <a name="l00077"></a>00077 <a name="l00078"></a>00078 <span class="keyword">typedef</span> <span class="keyword">typename</span> std::iterator_traits&lt;IteratorType&gt;::value_type char_type; <a name="l00079"></a>00079 <a name="l00080"></a>00080 <a name="l00081"></a>00081 <a name="l00082"></a>00082 <span class="keyword">static</span> <a class="code" href="group__boundary.html#ga7b4dd7af8fad53fabd77e629da24d466">index_type</a> map(<a class="code" href="group__boundary.html#ga15de9963ce9bb6037c8525901dfbf641">boundary_type</a> t,IteratorType b,IteratorType e,std::locale <span class="keyword">const</span> &amp;l) <a name="l00083"></a>00083 { <a name="l00084"></a>00084 <a class="code" href="group__boundary.html#ga7b4dd7af8fad53fabd77e629da24d466">index_type</a> result; <a name="l00085"></a>00085 <a name="l00086"></a>00086 <span class="comment">//</span> <a name="l00087"></a>00087 <span class="comment">// Optimize for most common cases</span> <a name="l00088"></a>00088 <span class="comment">//</span> <a name="l00089"></a>00089 <span class="comment">// C++0x requires that string is contiguous in memory and all known</span> <a name="l00090"></a>00090 <span class="comment">// string implementations</span> <a name="l00091"></a>00091 <span class="comment">// do this because of c_str() support. 
</span> <a name="l00092"></a>00092 <span class="comment">//</span> <a name="l00093"></a>00093 <a name="l00094"></a>00094 <span class="keywordflow">if</span>(linear_iterator_traits&lt;char_type,IteratorType&gt;::is_linear &amp;&amp; b!=e) <a name="l00095"></a>00095 { <a name="l00096"></a>00096 char_type <span class="keyword">const</span> *begin = &amp;*b; <a name="l00097"></a>00097 char_type <span class="keyword">const</span> *end = begin + (e-b); <a name="l00098"></a>00098 <a class="code" href="group__boundary.html#ga7b4dd7af8fad53fabd77e629da24d466">index_type</a> tmp=std::use_facet&lt;boundary_indexing&lt;char_type&gt; &gt;(l).map(t,begin,end); <a name="l00099"></a>00099 result.swap(tmp); <a name="l00100"></a>00100 } <a name="l00101"></a>00101 <span class="keywordflow">else</span> { <a name="l00102"></a>00102 std::basic_string&lt;char_type&gt; str(b,e); <a name="l00103"></a>00103 <a class="code" href="group__boundary.html#ga7b4dd7af8fad53fabd77e629da24d466">index_type</a> tmp = std::use_facet&lt;boundary_indexing&lt;char_type&gt; &gt;(l).map(t,str.c_str(),str.c_str()+str.size()); <a name="l00104"></a>00104 result.swap(tmp); <a name="l00105"></a>00105 } <a name="l00106"></a>00106 <span class="keywordflow">return</span> result; <a name="l00107"></a>00107 } <a name="l00108"></a>00108 }; <a name="l00109"></a>00109 <a name="l00110"></a>00110 <span class="keyword">template</span>&lt;<span class="keyword">typename</span> BaseIterator&gt; <a name="l00111"></a>00111 <span class="keyword">class </span>mapping { <a name="l00112"></a>00112 <span class="keyword">public</span>: <a name="l00113"></a>00113 <span class="keyword">typedef</span> BaseIterator base_iterator; <a name="l00114"></a>00114 <span class="keyword">typedef</span> <span class="keyword">typename</span> std::iterator_traits&lt;base_iterator&gt;::value_type char_type; <a name="l00115"></a>00115 <a name="l00116"></a>00116 <a name="l00117"></a>00117 mapping(<a class="code" 
href="group__boundary.html#ga15de9963ce9bb6037c8525901dfbf641">boundary_type</a> type, <a name="l00118"></a>00118 base_iterator begin, <a name="l00119"></a>00119 base_iterator end, <a name="l00120"></a>00120 std::locale <span class="keyword">const</span> &amp;loc) <a name="l00121"></a>00121 : <a name="l00122"></a>00122 index_(new <a class="code" href="group__boundary.html#ga7b4dd7af8fad53fabd77e629da24d466">index_type</a>()), <a name="l00123"></a>00123 begin_(begin), <a name="l00124"></a>00124 end_(end) <a name="l00125"></a>00125 { <a name="l00126"></a>00126 <a class="code" href="group__boundary.html#ga7b4dd7af8fad53fabd77e629da24d466">index_type</a> idx=details::mapping_traits&lt;base_iterator&gt;::map(type,begin,end,loc); <a name="l00127"></a>00127 index_-&gt;swap(idx); <a name="l00128"></a>00128 } <a name="l00129"></a>00129 <a name="l00130"></a>00130 mapping() <a name="l00131"></a>00131 { <a name="l00132"></a>00132 } <a name="l00133"></a>00133 <a name="l00134"></a>00134 <a class="code" href="group__boundary.html#ga7b4dd7af8fad53fabd77e629da24d466">index_type</a> <span class="keyword">const</span> &amp;index()<span class="keyword"> const</span> <a name="l00135"></a>00135 <span class="keyword"> </span>{ <a name="l00136"></a>00136 <span class="keywordflow">return</span> *index_; <a name="l00137"></a>00137 } <a name="l00138"></a>00138 <a name="l00139"></a>00139 base_iterator begin()<span class="keyword"> const</span> <a name="l00140"></a>00140 <span class="keyword"> </span>{ <a name="l00141"></a>00141 <span class="keywordflow">return</span> begin_; <a name="l00142"></a>00142 } <a name="l00143"></a>00143 <a name="l00144"></a>00144 base_iterator end()<span class="keyword"> const</span> <a name="l00145"></a>00145 <span class="keyword"> </span>{ <a name="l00146"></a>00146 <span class="keywordflow">return</span> end_; <a name="l00147"></a>00147 } <a name="l00148"></a>00148 <a name="l00149"></a>00149 <span class="keyword">private</span>: <a name="l00150"></a>00150 
boost::shared_ptr&lt;index_type&gt; index_; <a name="l00151"></a>00151 base_iterator begin_,end_; <a name="l00152"></a>00152 }; <a name="l00153"></a>00153 <a name="l00154"></a>00154 <span class="keyword">template</span>&lt;<span class="keyword">typename</span> BaseIterator&gt; <a name="l00155"></a>00155 <span class="keyword">class </span>segment_index_iterator : <a name="l00156"></a>00156 <span class="keyword">public</span> boost::iterator_facade&lt; <a name="l00157"></a>00157 segment_index_iterator&lt;BaseIterator&gt;, <a name="l00158"></a>00158 segment&lt;BaseIterator&gt;, <a name="l00159"></a>00159 boost::bidirectional_traversal_tag, <a name="l00160"></a>00160 segment&lt;BaseIterator&gt; const &amp; <a name="l00161"></a>00161 &gt; <a name="l00162"></a>00162 { <a name="l00163"></a>00163 <span class="keyword">public</span>: <a name="l00164"></a>00164 <span class="keyword">typedef</span> BaseIterator base_iterator; <a name="l00165"></a>00165 <span class="keyword">typedef</span> mapping&lt;base_iterator&gt; mapping_type; <a name="l00166"></a>00166 <span class="keyword">typedef</span> segment&lt;base_iterator&gt; segment_type; <a name="l00167"></a>00167 <a name="l00168"></a>00168 segment_index_iterator() : current_(0,0),map_(0) <a name="l00169"></a>00169 { <a name="l00170"></a>00170 } <a name="l00171"></a>00171 <a name="l00172"></a>00172 segment_index_iterator(base_iterator p,mapping_type <span class="keyword">const</span> *map,<a class="code" href="group__boundary.html#ga25e193c81052ef1795f1b53b46bc2095" title="Flags used with word boundary analysis -- the type of the word, line or sentence boundary found...">rule_type</a> mask,<span class="keywordtype">bool</span> full_select) : <a name="l00173"></a>00173 map_(map), <a name="l00174"></a>00174 mask_(mask), <a name="l00175"></a>00175 full_select_(full_select) <a name="l00176"></a>00176 { <a name="l00177"></a>00177 <span class="keyword">set</span>(p); <a name="l00178"></a>00178 } <a name="l00179"></a>00179 
segment_index_iterator(<span class="keywordtype">bool</span> is_begin,mapping_type <span class="keyword">const</span> *map,<a class="code" href="group__boundary.html#ga25e193c81052ef1795f1b53b46bc2095" title="Flags used with word boundary analysis -- the type of the word, line or sentence boundary found...">rule_type</a> mask,<span class="keywordtype">bool</span> full_select) : <a name="l00180"></a>00180 map_(map), <a name="l00181"></a>00181 mask_(mask), <a name="l00182"></a>00182 full_select_(full_select) <a name="l00183"></a>00183 { <a name="l00184"></a>00184 <span class="keywordflow">if</span>(is_begin) <a name="l00185"></a>00185 set_begin(); <a name="l00186"></a>00186 <span class="keywordflow">else</span> <a name="l00187"></a>00187 set_end(); <a name="l00188"></a>00188 } <a name="l00189"></a>00189 <a name="l00190"></a>00190 segment_type <span class="keyword">const</span> &amp;dereference()<span class="keyword"> const</span> <a name="l00191"></a>00191 <span class="keyword"> </span>{ <a name="l00192"></a>00192 <span class="keywordflow">return</span> value_; <a name="l00193"></a>00193 } <a name="l00194"></a>00194 <a name="l00195"></a>00195 <span class="keywordtype">bool</span> equal(segment_index_iterator <span class="keyword">const</span> &amp;other)<span class="keyword"> const</span> <a name="l00196"></a>00196 <span class="keyword"> </span>{ <a name="l00197"></a>00197 <span class="keywordflow">return</span> map_ == other.map_ &amp;&amp; current_.second == other.current_.second; <a name="l00198"></a>00198 } <a name="l00199"></a>00199 <a name="l00200"></a>00200 <span class="keywordtype">void</span> increment() <a name="l00201"></a>00201 { <a name="l00202"></a>00202 std::pair&lt;size_t,size_t&gt; next = current_; <a name="l00203"></a>00203 <span class="keywordflow">if</span>(full_select_) { <a name="l00204"></a>00204 next.first = next.second; <a name="l00205"></a>00205 <span class="keywordflow">while</span>(next.second &lt; size()) { <a name="l00206"></a>00206 
next.second++; <a name="l00207"></a>00207 <span class="keywordflow">if</span>(valid_offset(next.second)) <a name="l00208"></a>00208 <span class="keywordflow">break</span>; <a name="l00209"></a>00209 } <a name="l00210"></a>00210 <span class="keywordflow">if</span>(next.second == size()) <a name="l00211"></a>00211 next.first = next.second - 1; <a name="l00212"></a>00212 } <a name="l00213"></a>00213 <span class="keywordflow">else</span> { <a name="l00214"></a>00214 <span class="keywordflow">while</span>(next.second &lt; size()) { <a name="l00215"></a>00215 next.first = next.second; <a name="l00216"></a>00216 next.second++; <a name="l00217"></a>00217 <span class="keywordflow">if</span>(valid_offset(next.second)) <a name="l00218"></a>00218 <span class="keywordflow">break</span>; <a name="l00219"></a>00219 } <a name="l00220"></a>00220 } <a name="l00221"></a>00221 update_current(next); <a name="l00222"></a>00222 } <a name="l00223"></a>00223 <a name="l00224"></a>00224 <span class="keywordtype">void</span> decrement() <a name="l00225"></a>00225 { <a name="l00226"></a>00226 std::pair&lt;size_t,size_t&gt; next = current_; <a name="l00227"></a>00227 <span class="keywordflow">if</span>(full_select_) { <a name="l00228"></a>00228 <span class="keywordflow">while</span>(next.second &gt;1) { <a name="l00229"></a>00229 next.second--; <a name="l00230"></a>00230 <span class="keywordflow">if</span>(valid_offset(next.second)) <a name="l00231"></a>00231 <span class="keywordflow">break</span>; <a name="l00232"></a>00232 } <a name="l00233"></a>00233 next.first = next.second; <a name="l00234"></a>00234 <span class="keywordflow">while</span>(next.first &gt;0) { <a name="l00235"></a>00235 next.first--; <a name="l00236"></a>00236 <span class="keywordflow">if</span>(valid_offset(next.first)) <a name="l00237"></a>00237 <span class="keywordflow">break</span>; <a name="l00238"></a>00238 } <a name="l00239"></a>00239 } <a name="l00240"></a>00240 <span class="keywordflow">else</span> { <a 
name="l00241"></a>00241 <span class="keywordflow">while</span>(next.second &gt;1) { <a name="l00242"></a>00242 next.second--; <a name="l00243"></a>00243 <span class="keywordflow">if</span>(valid_offset(next.second)) <a name="l00244"></a>00244 <span class="keywordflow">break</span>; <a name="l00245"></a>00245 } <a name="l00246"></a>00246 next.first = next.second - 1; <a name="l00247"></a>00247 } <a name="l00248"></a>00248 update_current(next); <a name="l00249"></a>00249 } <a name="l00250"></a>00250 <a name="l00251"></a>00251 <span class="keyword">private</span>: <a name="l00252"></a>00252 <a name="l00253"></a>00253 <span class="keywordtype">void</span> set_end() <a name="l00254"></a>00254 { <a name="l00255"></a>00255 current_.first = size() - 1; <a name="l00256"></a>00256 current_.second = size(); <a name="l00257"></a>00257 value_ = segment_type(map_-&gt;end(),map_-&gt;end(),0); <a name="l00258"></a>00258 } <a name="l00259"></a>00259 <span class="keywordtype">void</span> set_begin() <a name="l00260"></a>00260 { <a name="l00261"></a>00261 current_.first = current_.second = 0; <a name="l00262"></a>00262 value_ = segment_type(map_-&gt;begin(),map_-&gt;begin(),0); <a name="l00263"></a>00263 increment(); <a name="l00264"></a>00264 } <a name="l00265"></a>00265 <a name="l00266"></a>00266 <span class="keywordtype">void</span> <span class="keyword">set</span>(base_iterator p) <a name="l00267"></a>00267 { <a name="l00268"></a>00268 <span class="keywordtype">size_t</span> dist=std::distance(map_-&gt;begin(),p); <a name="l00269"></a>00269 index_type::const_iterator b=map_-&gt;index().begin(),e=map_-&gt;index().end(); <a name="l00270"></a>00270 index_type::const_iterator <a name="l00271"></a>00271 boundary_point=std::upper_bound(b,e,break_info(dist)); <a name="l00272"></a>00272 <span class="keywordflow">while</span>(boundary_point != e &amp;&amp; (boundary_point-&gt;rule &amp; mask_)==0) <a name="l00273"></a>00273 boundary_point++; <a name="l00274"></a>00274 <a 
name="l00275"></a>00275 current_.first = current_.second = boundary_point - b; <a name="l00276"></a>00276 <a name="l00277"></a>00277 <span class="keywordflow">if</span>(full_select_) { <a name="l00278"></a>00278 <span class="keywordflow">while</span>(current_.first &gt; 0) { <a name="l00279"></a>00279 current_.first --; <a name="l00280"></a>00280 <span class="keywordflow">if</span>(valid_offset(current_.first)) <a name="l00281"></a>00281 <span class="keywordflow">break</span>; <a name="l00282"></a>00282 } <a name="l00283"></a>00283 } <a name="l00284"></a>00284 <span class="keywordflow">else</span> { <a name="l00285"></a>00285 <span class="keywordflow">if</span>(current_.first &gt; 0) <a name="l00286"></a>00286 current_.first --; <a name="l00287"></a>00287 } <a name="l00288"></a>00288 value_.first = map_-&gt;begin(); <a name="l00289"></a>00289 std::advance(value_.first,get_offset(current_.first)); <a name="l00290"></a>00290 value_.second = value_.first; <a name="l00291"></a>00291 std::advance(value_.second,get_offset(current_.second) - get_offset(current_.first)); <a name="l00292"></a>00292 <a name="l00293"></a>00293 update_rule(); <a name="l00294"></a>00294 } <a name="l00295"></a>00295 <a name="l00296"></a>00296 <span class="keywordtype">void</span> update_current(std::pair&lt;size_t,size_t&gt; pos) <a name="l00297"></a>00297 { <a name="l00298"></a>00298 std::ptrdiff_t first_diff = get_offset(pos.first) - get_offset(current_.first); <a name="l00299"></a>00299 std::ptrdiff_t second_diff = get_offset(pos.second) - get_offset(current_.second); <a name="l00300"></a>00300 std::advance(value_.first,first_diff); <a name="l00301"></a>00301 std::advance(value_.second,second_diff); <a name="l00302"></a>00302 current_ = pos; <a name="l00303"></a>00303 update_rule(); <a name="l00304"></a>00304 } <a name="l00305"></a>00305 <a name="l00306"></a>00306 <span class="keywordtype">void</span> update_rule() <a name="l00307"></a>00307 { <a name="l00308"></a>00308 <span 
class="keywordflow">if</span>(current_.second != size()) { <a name="l00309"></a>00309 value_.rule(index()[current_.second].rule); <a name="l00310"></a>00310 } <a name="l00311"></a>00311 } <a name="l00312"></a>00312 <span class="keywordtype">size_t</span> get_offset(<span class="keywordtype">size_t</span> ind)<span class="keyword"> const</span> <a name="l00313"></a>00313 <span class="keyword"> </span>{ <a name="l00314"></a>00314 <span class="keywordflow">if</span>(ind == size()) <a name="l00315"></a>00315 <span class="keywordflow">return</span> index().back().offset; <a name="l00316"></a>00316 <span class="keywordflow">return</span> index()[ind].offset; <a name="l00317"></a>00317 } <a name="l00318"></a>00318 <a name="l00319"></a>00319 <span class="keywordtype">bool</span> valid_offset(<span class="keywordtype">size_t</span> offset)<span class="keyword"> const</span> <a name="l00320"></a>00320 <span class="keyword"> </span>{ <a name="l00321"></a>00321 <span class="keywordflow">return</span> offset == 0 <a name="l00322"></a>00322 || offset == size() <span class="comment">// make sure we do not access index[size]</span> <a name="l00323"></a>00323 || (index()[offset].rule &amp; mask_)!=0; <a name="l00324"></a>00324 } <a name="l00325"></a>00325 <a name="l00326"></a>00326 <span class="keywordtype">size_t</span> size()<span class="keyword"> const</span> <a name="l00327"></a>00327 <span class="keyword"> </span>{ <a name="l00328"></a>00328 <span class="keywordflow">return</span> index().size(); <a name="l00329"></a>00329 } <a name="l00330"></a>00330 <a name="l00331"></a>00331 <a class="code" href="group__boundary.html#ga7b4dd7af8fad53fabd77e629da24d466">index_type</a> <span class="keyword">const</span> &amp;index()<span class="keyword"> const</span> <a name="l00332"></a>00332 <span class="keyword"> </span>{ <a name="l00333"></a>00333 <span class="keywordflow">return</span> map_-&gt;index(); <a name="l00334"></a>00334 } <a name="l00335"></a>00335 <a name="l00336"></a>00336 <a 
name="l00337"></a>00337 segment_type value_; <a name="l00338"></a>00338 std::pair&lt;size_t,size_t&gt; current_; <a name="l00339"></a>00339 mapping_type <span class="keyword">const</span> *map_; <a name="l00340"></a>00340 <a class="code" href="group__boundary.html#ga25e193c81052ef1795f1b53b46bc2095" title="Flags used with word boundary analysis -- the type of the word, line or sentence boundary found...">rule_type</a> mask_; <a name="l00341"></a>00341 <span class="keywordtype">bool</span> full_select_; <a name="l00342"></a>00342 }; <a name="l00343"></a>00343 <a name="l00344"></a>00344 <span class="keyword">template</span>&lt;<span class="keyword">typename</span> BaseIterator&gt; <a name="l00345"></a>00345 <span class="keyword">class </span>boundary_point_index_iterator : <a name="l00346"></a>00346 <span class="keyword">public</span> boost::iterator_facade&lt; <a name="l00347"></a>00347 boundary_point_index_iterator&lt;BaseIterator&gt;, <a name="l00348"></a>00348 boundary_point&lt;BaseIterator&gt;, <a name="l00349"></a>00349 boost::bidirectional_traversal_tag, <a name="l00350"></a>00350 boundary_point&lt;BaseIterator&gt; const &amp; <a name="l00351"></a>00351 &gt; <a name="l00352"></a>00352 { <a name="l00353"></a>00353 <span class="keyword">public</span>: <a name="l00354"></a>00354 <span class="keyword">typedef</span> BaseIterator base_iterator; <a name="l00355"></a>00355 <span class="keyword">typedef</span> mapping&lt;base_iterator&gt; mapping_type; <a name="l00356"></a>00356 <span class="keyword">typedef</span> boundary_point&lt;base_iterator&gt; boundary_point_type; <a name="l00357"></a>00357 <a name="l00358"></a>00358 boundary_point_index_iterator() : current_(0),map_(0) <a name="l00359"></a>00359 { <a name="l00360"></a>00360 } <a name="l00361"></a>00361 <a name="l00362"></a>00362 boundary_point_index_iterator(<span class="keywordtype">bool</span> is_begin,mapping_type <span class="keyword">const</span> *map,<a class="code" 
href="group__boundary.html#ga25e193c81052ef1795f1b53b46bc2095" title="Flags used with word boundary analysis -- the type of the word, line or sentence boundary found...">rule_type</a> mask) : <a name="l00363"></a>00363 map_(map), <a name="l00364"></a>00364 mask_(mask) <a name="l00365"></a>00365 { <a name="l00366"></a>00366 <span class="keywordflow">if</span>(is_begin) <a name="l00367"></a>00367 set_begin(); <a name="l00368"></a>00368 <span class="keywordflow">else</span> <a name="l00369"></a>00369 set_end(); <a name="l00370"></a>00370 } <a name="l00371"></a>00371 boundary_point_index_iterator(base_iterator p,mapping_type <span class="keyword">const</span> *map,<a class="code" href="group__boundary.html#ga25e193c81052ef1795f1b53b46bc2095" title="Flags used with word boundary analysis -- the type of the word, line or sentence boundary found...">rule_type</a> mask) : <a name="l00372"></a>00372 map_(map), <a name="l00373"></a>00373 mask_(mask) <a name="l00374"></a>00374 { <a name="l00375"></a>00375 <span class="keyword">set</span>(p); <a name="l00376"></a>00376 } <a name="l00377"></a>00377 <a name="l00378"></a>00378 boundary_point_type <span class="keyword">const</span> &amp;dereference()<span class="keyword"> const</span> <a name="l00379"></a>00379 <span class="keyword"> </span>{ <a name="l00380"></a>00380 <span class="keywordflow">return</span> value_; <a name="l00381"></a>00381 } <a name="l00382"></a>00382 <a name="l00383"></a>00383 <span class="keywordtype">bool</span> equal(boundary_point_index_iterator <span class="keyword">const</span> &amp;other)<span class="keyword"> const</span> <a name="l00384"></a>00384 <span class="keyword"> </span>{ <a name="l00385"></a>00385 <span class="keywordflow">return</span> map_ == other.map_ &amp;&amp; current_ == other.current_; <a name="l00386"></a>00386 } <a name="l00387"></a>00387 <a name="l00388"></a>00388 <span class="keywordtype">void</span> increment() <a name="l00389"></a>00389 { <a name="l00390"></a>00390 <span 
class="keywordtype">size_t</span> next = current_; <a name="l00391"></a>00391 <span class="keywordflow">while</span>(next &lt; size()) { <a name="l00392"></a>00392 next++; <a name="l00393"></a>00393 <span class="keywordflow">if</span>(valid_offset(next)) <a name="l00394"></a>00394 <span class="keywordflow">break</span>; <a name="l00395"></a>00395 } <a name="l00396"></a>00396 update_current(next); <a name="l00397"></a>00397 } <a name="l00398"></a>00398 <a name="l00399"></a>00399 <span class="keywordtype">void</span> decrement() <a name="l00400"></a>00400 { <a name="l00401"></a>00401 <span class="keywordtype">size_t</span> next = current_; <a name="l00402"></a>00402 <span class="keywordflow">while</span>(next&gt;0) { <a name="l00403"></a>00403 next--; <a name="l00404"></a>00404 <span class="keywordflow">if</span>(valid_offset(next)) <a name="l00405"></a>00405 <span class="keywordflow">break</span>; <a name="l00406"></a>00406 } <a name="l00407"></a>00407 update_current(next); <a name="l00408"></a>00408 } <a name="l00409"></a>00409 <a name="l00410"></a>00410 <span class="keyword">private</span>: <a name="l00411"></a>00411 <span class="keywordtype">void</span> set_end() <a name="l00412"></a>00412 { <a name="l00413"></a>00413 current_ = size(); <a name="l00414"></a>00414 value_ = boundary_point_type(map_-&gt;end(),0); <a name="l00415"></a>00415 } <a name="l00416"></a>00416 <span class="keywordtype">void</span> set_begin() <a name="l00417"></a>00417 { <a name="l00418"></a>00418 current_ = 0; <a name="l00419"></a>00419 value_ = boundary_point_type(map_-&gt;begin(),0); <a name="l00420"></a>00420 } <a name="l00421"></a>00421 <a name="l00422"></a>00422 <span class="keywordtype">void</span> <span class="keyword">set</span>(base_iterator p) <a name="l00423"></a>00423 { <a name="l00424"></a>00424 <span class="keywordtype">size_t</span> dist = std::distance(map_-&gt;begin(),p); <a name="l00425"></a>00425 <a name="l00426"></a>00426 index_type::const_iterator b=index().begin(); <a 
name="l00427"></a>00427 index_type::const_iterator e=index().end(); <a name="l00428"></a>00428 index_type::const_iterator ptr = std::lower_bound(b,e,break_info(dist)); <a name="l00429"></a>00429 <a name="l00430"></a>00430 <span class="keywordflow">if</span>(ptr==index().end()) <a name="l00431"></a>00431 current_=size()-1; <a name="l00432"></a>00432 <span class="keywordflow">else</span> <a name="l00433"></a>00433 current_=ptr - index().begin(); <a name="l00434"></a>00434 <a name="l00435"></a>00435 <span class="keywordflow">while</span>(!valid_offset(current_)) <a name="l00436"></a>00436 current_ ++; <a name="l00437"></a>00437 <a name="l00438"></a>00438 std::ptrdiff_t diff = get_offset(current_) - dist; <a name="l00439"></a>00439 std::advance(p,diff); <a name="l00440"></a>00440 value_.iterator(p); <a name="l00441"></a>00441 update_rule(); <a name="l00442"></a>00442 } <a name="l00443"></a>00443 <a name="l00444"></a>00444 <span class="keywordtype">void</span> update_current(<span class="keywordtype">size_t</span> pos) <a name="l00445"></a>00445 { <a name="l00446"></a>00446 std::ptrdiff_t diff = get_offset(pos) - get_offset(current_); <a name="l00447"></a>00447 base_iterator i=value_.iterator(); <a name="l00448"></a>00448 std::advance(i,diff); <a name="l00449"></a>00449 current_ = pos; <a name="l00450"></a>00450 value_.iterator(i); <a name="l00451"></a>00451 update_rule(); <a name="l00452"></a>00452 } <a name="l00453"></a>00453 <a name="l00454"></a>00454 <span class="keywordtype">void</span> update_rule() <a name="l00455"></a>00455 { <a name="l00456"></a>00456 <span class="keywordflow">if</span>(current_ != size()) { <a name="l00457"></a>00457 value_.rule(index()[current_].rule); <a name="l00458"></a>00458 } <a name="l00459"></a>00459 } <a name="l00460"></a>00460 <span class="keywordtype">size_t</span> get_offset(<span class="keywordtype">size_t</span> ind)<span class="keyword"> const</span> <a name="l00461"></a>00461 <span class="keyword"> </span>{ <a 
name="l00462"></a>00462 <span class="keywordflow">if</span>(ind == size()) <a name="l00463"></a>00463 <span class="keywordflow">return</span> index().back().offset; <a name="l00464"></a>00464 <span class="keywordflow">return</span> index()[ind].offset; <a name="l00465"></a>00465 } <a name="l00466"></a>00466 <a name="l00467"></a>00467 <span class="keywordtype">bool</span> valid_offset(<span class="keywordtype">size_t</span> offset)<span class="keyword"> const</span> <a name="l00468"></a>00468 <span class="keyword"> </span>{ <a name="l00469"></a>00469 <span class="keywordflow">return</span> offset == 0 <a name="l00470"></a>00470 || offset + 1 &gt;= size() <span class="comment">// last and first are always valid regardless of mark</span> <a name="l00471"></a>00471 || (index()[offset].rule &amp; mask_)!=0; <a name="l00472"></a>00472 } <a name="l00473"></a>00473 <a name="l00474"></a>00474 <span class="keywordtype">size_t</span> size()<span class="keyword"> const</span> <a name="l00475"></a>00475 <span class="keyword"> </span>{ <a name="l00476"></a>00476 <span class="keywordflow">return</span> index().size(); <a name="l00477"></a>00477 } <a name="l00478"></a>00478 <a name="l00479"></a>00479 <a class="code" href="group__boundary.html#ga7b4dd7af8fad53fabd77e629da24d466">index_type</a> <span class="keyword">const</span> &amp;index()<span class="keyword"> const</span> <a name="l00480"></a>00480 <span class="keyword"> </span>{ <a name="l00481"></a>00481 <span class="keywordflow">return</span> map_-&gt;index(); <a name="l00482"></a>00482 } <a name="l00483"></a>00483 <a name="l00484"></a>00484 <a name="l00485"></a>00485 boundary_point_type value_; <a name="l00486"></a>00486 <span class="keywordtype">size_t</span> current_; <a name="l00487"></a>00487 mapping_type <span class="keyword">const</span> *map_; <a name="l00488"></a>00488 <a class="code" href="group__boundary.html#ga25e193c81052ef1795f1b53b46bc2095" title="Flags used with word boundary analysis -- the type of the word, 
line or sentence boundary found...">rule_type</a> mask_; <a name="l00489"></a>00489 }; <a name="l00490"></a>00490 <a name="l00491"></a>00491 <a name="l00492"></a>00492 } <span class="comment">// details</span> <a name="l00493"></a>00493 <a name="l00495"></a>00495 <a name="l00496"></a>00496 <span class="keyword">template</span>&lt;<span class="keyword">typename</span> BaseIterator&gt; <a name="l00497"></a>00497 <span class="keyword">class </span>segment_index; <a name="l00498"></a>00498 <a name="l00499"></a>00499 <span class="keyword">template</span>&lt;<span class="keyword">typename</span> BaseIterator&gt; <a name="l00500"></a>00500 <span class="keyword">class </span>boundary_point_index; <a name="l00501"></a>00501 <a name="l00502"></a>00502 <a name="l00554"></a>00554 <a name="l00555"></a>00555 <span class="keyword">template</span>&lt;<span class="keyword">typename</span> BaseIterator&gt; <a name="l00556"></a><a class="code" href="classboost_1_1locale_1_1boundary_1_1segment__index.html">00556</a> <span class="keyword">class </span><a class="code" href="classboost_1_1locale_1_1boundary_1_1segment__index.html" title="This class holds an index of segments in the text range and allows to iterate over them...">segment_index</a> { <a name="l00557"></a>00557 <span class="keyword">public</span>: <a name="l00558"></a>00558 <a name="l00562"></a><a class="code" href="group__boundary.html#ga06f2faacb9d196ebc659ad5382ea2ca5">00562</a> <span class="keyword">typedef</span> BaseIterator <a class="code" href="group__boundary.html#ga06f2faacb9d196ebc659ad5382ea2ca5">base_iterator</a>; <a name="l00563"></a>00563 <span class="preprocessor"> #ifdef BOOST_LOCALE_DOXYGEN</span> <a name="l00564"></a>00564 <span class="preprocessor"></span> <a name="l00565"></a>00565 <a name="l00566"></a>00566 <a name="l00567"></a>00567 <a name="l00568"></a>00568 <a name="l00569"></a>00569 <a name="l00570"></a>00570 <a name="l00571"></a>00571 <a name="l00572"></a>00572 <a name="l00573"></a>00573 <a 
name="l00574"></a>00574 <a name="l00575"></a>00575 <a name="l00576"></a>00576 <a name="l00577"></a>00577 <a name="l00578"></a><a class="code" href="group__boundary.html#gaf7a775e77dbbca3495e11d646df96fd2">00578</a> <span class="keyword">typedef</span> unspecified_iterator_type <a class="code" href="group__boundary.html#gaf7a775e77dbbca3495e11d646df96fd2">iterator</a>; <a name="l00582"></a><a class="code" href="group__boundary.html#ga5f8e61b5babc3f0fa95f5fb8acae3724">00582</a> <span class="keyword">typedef</span> unspecified_iterator_type <a class="code" href="group__boundary.html#ga5f8e61b5babc3f0fa95f5fb8acae3724">const_iterator</a>; <a name="l00583"></a>00583 <span class="preprocessor"> #else</span> <a name="l00584"></a>00584 <span class="preprocessor"></span> <span class="keyword">typedef</span> details::segment_index_iterator&lt;base_iterator&gt; <a class="code" href="group__boundary.html#gaf7a775e77dbbca3495e11d646df96fd2">iterator</a>; <a name="l00585"></a>00585 <span class="keyword">typedef</span> details::segment_index_iterator&lt;base_iterator&gt; <a class="code" href="group__boundary.html#ga5f8e61b5babc3f0fa95f5fb8acae3724">const_iterator</a>; <a name="l00586"></a>00586 <span class="preprocessor"> #endif</span> <a name="l00587"></a>00587 <span class="preprocessor"></span> <a name="l00588"></a>00588 <a name="l00589"></a>00589 <a name="l00590"></a>00590 <a name="l00591"></a><a class="code" href="group__boundary.html#ga067c663d18faee08adb3355701ae72ba">00591</a> <span class="keyword">typedef</span> <a class="code" href="classboost_1_1locale_1_1boundary_1_1segment.html" title="a segment object that represents a pair of two iterators that define the range where this segment exi...">segment&lt;base_iterator&gt;</a> <a class="code" href="group__boundary.html#ga067c663d18faee08adb3355701ae72ba">value_type</a>; <a name="l00592"></a>00592 <a name="l00602"></a><a class="code" href="group__boundary.html#ga2c354f4cc03677b58c97038cd84dc465">00602</a> <a class="code" 
href="group__boundary.html#ga2c354f4cc03677b58c97038cd84dc465">segment_index</a>() : mask_(0xFFFFFFFFu),full_select_(false) <a name="l00603"></a>00603 { <a name="l00604"></a>00604 } <a name="l00609"></a><a class="code" href="group__boundary.html#ga06ddc335e95479ec51e9b16d0f829bb3">00609</