Support: quest -f cjk_ngram
[xapian.git] / xapian-core / unicode / description_append.cc
blob0feeb96a731c40f8e7f1713f2530ae497997ce1c
1 /** @file description_append.cc
2 * @brief Append a string to an object description, escaping invalid UTF-8
3 */
4 /* Copyright (C) 2013 Olly Betts
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation; either version 2 of the License, or
9 * (at your option) any later version.
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
21 #include <config.h>
23 #include "description_append.h"
24 #include "xapian/unicode.h"
26 #include <cstdio>
27 #include <string>
29 using namespace std;
31 void
32 description_append(std::string & desc, const std::string &s)
34 desc.reserve(desc.size() + s.size());
35 for (Xapian::Utf8Iterator i(s); i != Xapian::Utf8Iterator(); ++i) {
36 unsigned ch = i.strict_deref();
37 if ((ch & 0x80000000) == 0 && ch >= ' ' && ch != '\\' && ch != 127) {
38 Xapian::Unicode::append_utf8(desc, ch);
39 } else {
40 char buf[8];
41 sprintf(buf, "\\x%02x", ch & 0xff);
42 desc += buf;