Updated the documentation to have a better intro sample
git-svn-id: http://svn.code.sf.net/p/utfcpp/code@90 a809a056-fc17-0410-9590-b4f493f8b08e
This commit is contained in:
parent
4039d395d5
commit
a13d284b20
1 changed files with 14 additions and 18 deletions
|
@ -57,6 +57,10 @@
|
||||||
</li>
|
</li>
|
||||||
<li>
|
<li>
|
||||||
<a href="#examples">Examples of Use</a>
|
<a href="#examples">Examples of Use</a>
|
||||||
|
<ul class="toc">
|
||||||
|
<li>
|
||||||
|
<a href=#introsample>Introductionary Sample </a>
|
||||||
|
</li>
|
||||||
</li>
|
</li>
|
||||||
<li>
|
<li>
|
||||||
<a href="#reference">Reference</a>
|
<a href="#reference">Reference</a>
|
||||||
|
@ -115,11 +119,13 @@
|
||||||
<h2 id="examples">
|
<h2 id="examples">
|
||||||
Examples of use
|
Examples of use
|
||||||
</h2>
|
</h2>
|
||||||
|
<h3 id="introsample">
|
||||||
|
Introductionary Sample
|
||||||
|
</h3>
|
||||||
<p>
|
<p>
|
||||||
To illustrate the use of this utf8 library, we shall open a file containing UTF-8
|
To illustrate the use of this utf8 library, let's start with a small but complete program
|
||||||
encoded text, check whether it starts with a byte order mark, read each line into a
|
that opens a file containing UTF-8 encoded text, reads it line by line, checks each line
|
||||||
<code>std::string</code>, check it for validity, convert the text to UTF-16, and
|
for invalid UTF-8 byte sequences, and converts it to UTF-16 encoding and back to UTF-8:
|
||||||
back to UTF-8:
|
|
||||||
</p>
|
</p>
|
||||||
<pre>
|
<pre>
|
||||||
<span class="preprocessor">#include <fstream></span>
|
<span class="preprocessor">#include <fstream></span>
|
||||||
|
@ -135,26 +141,17 @@
|
||||||
<span class="keyword">return</span> <span class="literal">0</span>;
|
<span class="keyword">return</span> <span class="literal">0</span>;
|
||||||
}
|
}
|
||||||
<span class="keyword">const char</span>* test_file_path = argv[1];
|
<span class="keyword">const char</span>* test_file_path = argv[1];
|
||||||
<span class="comment">// Open the test file (must be UTF-8 encoded)</span>
|
<span class="comment">// Open the test file (contains UTF-8 encoded text)</span>
|
||||||
ifstream fs8(test_file_path);
|
ifstream fs8(test_file_path);
|
||||||
<span class="keyword">if</span> (!fs8.is_open()) {
|
<span class="keyword">if</span> (!fs8.is_open()) {
|
||||||
cout << <span class=
|
cout << <span class=
|
||||||
"literal">"Could not open "</span> << test_file_path << endl;
|
"literal">"Could not open "</span> << test_file_path << endl;
|
||||||
<span class="keyword">return</span> <span class="literal">0</span>;
|
<span class="keyword">return</span> <span class="literal">0</span>;
|
||||||
}
|
}
|
||||||
<span class="comment">// Read the first line of the file</span>
|
|
||||||
<span class="keyword">unsigned</span> line_count = <span class="literal">1</span>;
|
<span class="keyword">unsigned</span> line_count = <span class="literal">1</span>;
|
||||||
string line;
|
string line;
|
||||||
<span class="keyword">if</span> (!getline(fs8, line))
|
|
||||||
<span class="keyword">return</span> <span class="literal">0</span>;
|
|
||||||
<span class="comment">// Look for utf-8 byte-order mark at the beginning</span>
|
|
||||||
<span class="keyword">if</span> (line.size() > <span class="literal">2</span>) {
|
|
||||||
<span class="keyword">if</span> (utf8::is_bom(line.c_str()))
|
|
||||||
cout << <span class=
|
|
||||||
"literal">"There is a byte order mark at the beginning of the file\n"</span>;
|
|
||||||
}
|
|
||||||
<span class="comment">// Play with all the lines in the file</span>
|
<span class="comment">// Play with all the lines in the file</span>
|
||||||
<span class="keyword">do</span> {
|
<span class="keyword">while</span> (getline(fs8, line)) {
|
||||||
<span class="comment">// check for invalid utf-8 (for a simple yes/no check, there is also utf8::is_valid function)</span>
|
<span class="comment">// check for invalid utf-8 (for a simple yes/no check, there is also utf8::is_valid function)</span>
|
||||||
string::iterator end_it = utf8::find_invalid(line.begin(), line.end());
|
string::iterator end_it = utf8::find_invalid(line.begin(), line.end());
|
||||||
<span class="keyword">if</span> (end_it != line.end()) {
|
<span class="keyword">if</span> (end_it != line.end()) {
|
||||||
|
@ -181,11 +178,10 @@
|
||||||
cout << <span class=
|
cout << <span class=
|
||||||
"literal">"Error in UTF-16 conversion at line: "</span> << line_count << <span
|
"literal">"Error in UTF-16 conversion at line: "</span> << line_count << <span
|
||||||
class="literal">"\n"</span>;
|
class="literal">"\n"</span>;
|
||||||
getline(fs8, line);
|
|
||||||
line_count++;
|
line_count++;
|
||||||
} <span class="keyword">while</span> (!fs8.eof());
|
|
||||||
<span class="keyword">return</span> <span class="literal">0</span>;
|
|
||||||
}
|
}
|
||||||
|
<span class="keyword">return</span> <span class="literal">0</span>;
|
||||||
|
|
||||||
</pre>
|
</pre>
|
||||||
<p>
|
<p>
|
||||||
In the previous code sample, we have seen the use of the following functions from
|
In the previous code sample, we have seen the use of the following functions from
|
||||||
|
|
Loading…
Reference in a new issue