Change find_html_comments() API to return the results
[libi2ncommon] / src / stringfunc.hxx
CommitLineData
0e23f538
TJ
1/*
2The software in this package is distributed under the GNU General
3Public License version 2 (with a special exception described below).
4
5A copy of GNU General Public License (GPL) is included in this distribution,
6in the file COPYING.GPL.
7
8As a special exception, if other files instantiate templates or use macros
9or inline functions from this file, or you compile this file and link it
10with other works to produce a work based on this file, this file
11does not by itself cause the resulting work to be covered
12by the GNU General Public License.
13
14However the source code for this file must still be made available
15in accordance with section (3) of the GNU General Public License.
16
17This exception does not invalidate any other reasons why a work based
18on this file might be covered by the GNU General Public License.
19*/
6a93d84a
TJ
20/** @file
21 * @brief collection of string tools (/ functions).
22 *
23 * contains a collection of miscellaneous functions for dealing with strings.
24 *
25 * some functions (like trim, lower case, upper case ...) are available in two versions:
26 * - a modifying one (suffix "Mod") which modifies the given string argument in place.
27 * - a non modifying one which take a constant string reference and returns a new string.
28 * .
29 *
30 *
31 * (c) Copyright 2007-2008 by Intra2net AG
6a93d84a 32 */
e93545dd
GE
33
34#ifndef __STRINGFUNC_HXX
35#define __STRINGFUNC_HXX
36
6a93d84a 37#include <list>
376ec4fa 38#include <vector>
e93545dd 39#include <string>
6a93d84a
TJ
40#include <sstream>
41#include <stdexcept>
b04b4f7e 42#include <sys/types.h>
6a93d84a 43
6ab3bc95
RP
44namespace I2n
45{
6a93d84a
TJ
46
47/*
48** some useful constants:
49*/
50
6ab3bc95
RP
51extern const std::string Whitespaces;
52extern const std::string LineEndings;
6a93d84a
TJ
53
54
55/*
56** predicates:
57*/
58
59
6ab3bc95 60bool has_prefix(const std::string& str, const std::string& prefix);
6a93d84a 61
6ab3bc95 62bool has_suffix(const std::string& str, const std::string& suffix);
6a93d84a
TJ
63
64
65/*
6ab3bc95 66** tool functions(modifying):
6a93d84a
TJ
67*/
68
6ab3bc95 69std::string trim_mod(std::string& str, const std::string& charlist = Whitespaces);
6a93d84a 70
6ab3bc95 71std::string chomp_mod(std::string& str, const std::string& what= LineEndings );
6a93d84a 72
6ab3bc95 73std::string to_lower_mod(std::string& str);
6a93d84a 74
6ab3bc95 75std::string to_upper_mod(std::string& str);
6a93d84a
TJ
76
77
78/*
79** tool functions (not modifying):
80*/
81
6ab3bc95 82std::string trim(const std::string& str, const std::string& charlist = Whitespaces);
6a93d84a 83
6ab3bc95 84std::string chomp(const std::string& str, const std::string& what= LineEndings );
6a93d84a 85
6ab3bc95 86std::string to_lower(const std::string& str);
6a93d84a 87
6ab3bc95 88std::string to_upper(const std::string& str);
6a93d84a
TJ
89
90
6ab3bc95 91std::string remove_suffix(const std::string& str, const std::string& suffix);
6a93d84a 92
6ab3bc95 93std::string remove_prefix(const std::string& str, const std::string& prefix);
6a93d84a
TJ
94
95
96
97/*
98** split and join:
99*/
100
101
6ab3bc95
RP
102bool pair_split(
103 const std::string& str,
104 std::string& key,
105 std::string& value,
106 char delimiter = '=');
6a93d84a
TJ
107
108
6ab3bc95
RP
109void split_string(
110 const std::string& str,
111 std::list< std::string >& result,
112 const std::string& delimiter= "\n",
113 bool omit_empty= false,
114 const std::string& trim_list= std::string()
6a93d84a
TJ
115);
116
6ab3bc95
RP
117std::list< std::string > split_string(
118 const std::string& str,
119 const std::string& delimiter = "\n",
120 bool omit_empty= false,
121 const std::string& trim_list= std::string()
6a93d84a
TJ
122);
123
124
6ab3bc95
RP
125std::string join_string(
126 const std::list< std::string >& parts,
127 const std::string& delimiter = "\n"
6a93d84a
TJ
128);
129
376ec4fa
CH
130std::string join_string(
131 const std::vector< std::string >& parts,
132 const std::string& delimiter = "\n"
133);
134
6a93d84a
TJ
135
136/*
137** conversions:
138*/
139
140
6ab3bc95 141std::string convert_binary_to_hex(const std::string&str, bool upper_case_digits= false);
6a93d84a 142
6ab3bc95 143std::string convert_hex_to_binary(const std::string& str) throw(std::runtime_error);
6a93d84a
TJ
144
145
6a93d84a
TJ
146/*
147** "type conversions":
148*/
149
150
/**
 * convert a string to a value of datatype @a T via string stream.
 *
 * The value is read with the stream extraction operator of @a T, so leading
 * whitespace is skipped and any trailing input after the value is ignored.
 *
 * This will not report trouble in conversion; for example:
 *     string_to<int>("christian")
 * will return 0 and not throw an error.
 * Use boost::lexical_cast<T>(string) to get error-checked results.
 *
 * The result starts out value-initialized, so an empty (or otherwise
 * unreadable) string never yields an indeterminate value.
 *
 * @param s the string which should be converted to @a T.
 * @return the value of type T.
 */
template<
    class T
>
T string_to(const std::string& s)
{
    std::istringstream istr(s);
    // value-initialize: if the stream is already at EOF (e.g. empty input)
    // the extraction below does not touch the target at all.
    T result = T();
    istr >> result;
    return result;
} // eo string_to(const std::string&)
6a93d84a
TJ
172
173
/**
 * convert a string to a value of datatype @a T via string stream.
 *
 * @param s the string which should be converted to @a T.
 * @param result receives the extracted value of type @a T.
 * @return @a true iff the internal string stream was at EOF after the extraction,
 *         i.e. no unread characters were left behind the value.
 *
 * @attention the return value does not tell whether the conversion itself
 *            succeeded: an empty string also ends at EOF and yields @a true
 *            while leaving @a result untouched. So check for empty strings before.
 */
template<typename T>
bool string_to(const std::string& s, T& result)
{
    std::istringstream input(s);
    input >> result;

    // only "everything was consumed" is reported, not "extraction worked"
    const bool consumed_everything = input.eof();
    return consumed_everything;
} // eo string_to(const std::string&,T&)
6a93d84a
TJ
192
193
/**
 * convert string in hexadecimal notation to a datatype @a T
 * supports strings with and without "0x" notation, e.g. 0xff and FF are both valid
 *
 * Conversion trouble is not reported. The result starts out value-initialized,
 * so an empty (or otherwise unreadable) string never yields an indeterminate value.
 *
 * @param s the hex string which should be converted to @a T.
 * @return the value of type T.
 */
template<
    class T
>
T hex_string_to(const std::string& s)
{
    std::istringstream istr(s);
    // value-initialize: if the stream is already at EOF (e.g. empty input)
    // the extraction below does not touch the target at all.
    T result = T();
    istr >> std::hex >> result;
    return result;
} // eo hex_string_to(const std::string&)
211
212
/**
 * convert string in hexadecimal notation to a datatype @a T
 * supports strings with and without "0x" notation, e.g. 0xff and FF are both valid
 *
 * @param s the hex string which should be converted to @a T.
 * @param result receives the extracted value of type @a T.
 * @return @a true iff the internal string stream was at EOF after the extraction,
 *         i.e. no unread characters were left behind the value.
 *
 * @attention the return value does not tell whether the conversion itself
 *            succeeded: an empty string also ends at EOF and yields @a true
 *            while leaving @a result untouched. So check for empty strings before.
 */
template<typename T>
bool hex_string_to(const std::string& s, T& result)
{
    std::istringstream input(s);

    // switch the stream to base 16 (same effect as the std::hex manipulator)
    input.setf(std::ios_base::hex, std::ios_base::basefield);
    input >> result;

    // only "everything was consumed" is reported, not "extraction worked"
    const bool consumed_everything = input.eof();
    return consumed_everything;
} // eo hex_string_to(const std::string&,T&)
232
233
/**
 * convert a value of datatype @a T to a string via string stream.
 *
 * The text is whatever the stream insertion operator of @a T writes
 * into a default constructed output string stream.
 *
 * @param v the value (of type @a T) which should be converted to a string.
 * @return the resulting string.
 */
template<typename T>
std::string to_string(const T& v)
{
    std::ostringstream formatted;
    formatted << v;

    const std::string text = formatted.str();
    return text;
} // eo to_string(const T&)
249
250
251} // eo namespace I2n
252
6a93d84a 253
e5b21dbb 254#if 0
6ab3bc95
RP
255std::string to_lower(const std::string &src);
256std::string to_upper(const std::string &src);
e5b21dbb
RP
257#else
258// compatibility: import lower/upper funcs from I2n:
259using I2n::to_lower;
260using I2n::to_upper;
261#endif
e93545dd 262
81267544 263
8f296924
GMF
/// Selects the multiplier between two neighbouring size units.
enum UnitBase
{
    /// SI decimal, composed by multiples of 1000 (KB, MB, etc.)
    UnitBase1000 = 0,
    /// IEC binary, composed by multiples of 1024 (KiB, MiB, etc.)
    UnitBase1024 = 1
};
268
8f296924
GMF
/// Selects how the unit name is spelled out.
enum UnitFormat
{
    /// B, KB, MB, ...
    ShortUnitFormat = 0,
    /// Byte, KByte, MByte, ...
    LongUnitFormat = 1
};
273
81267544
GMF
274std::string nice_unit_format(
275 const int64_t input,
ee037ee3
GMF
276 const UnitFormat format = ShortUnitFormat,
277 const UnitBase base = UnitBase1024
81267544 278);
e93545dd 279
5cd64148
CH
280std::string nice_unit_format(
281 const double input,
282 const UnitFormat format = ShortUnitFormat,
283 const UnitBase base = UnitBase1024
284);
285
e93545dd
GE
286bool replace_all(std::string &base, const std::string *ist, const std::string *soll);
287bool replace_all(std::string &base, const char *ist, const char *soll);
288bool replace_all(std::string &base, const char *ist, const std::string *soll);
289bool replace_all(std::string &base, const std::string &ist, const char *soll);
290bool replace_all(std::string &base, const std::string &ist, const std::string &soll);
291
292std::string iso_to_utf8(const std::string& isostring);
293std::string utf8_to_iso(const std::string& utf8string);
13cc4db1 294std::string utf7imap_to_utf8(const std::string &utf7imapstring);
6a2b6dd1 295std::string utf8_to_utf7imap(const std::string &utf8string);
118e216e
TJ
296
297std::string strip_html_tags(const std::string &input);
298std::string smart_html_entities(const std::string &input);
299std::string html_entities(std::string str);
554f813d 300std::string html_entities_to_console(std::string str);
118e216e 301
3f5c5ccd 302typedef std::pair<std::string::size_type, std::string::size_type> CommentZone;
46dd1321 303std::vector<CommentZone> find_html_comments(const std::string &str);
3f5c5ccd
CH
304void remove_html_comments(std::string &str);
305void remove_html_comments(std::string &str, const std::vector<CommentZone> &comments);
306
b953bf36
GE
307std::string sanitize_for_logging(const std::string &str, const char replace_with='?');
308
47c07fba
GE
309std::string escape(const std::string &s);
310
311std::string descape(const std::string &s, int startpos, int &endpos);
e6da286a 312inline std::string descape(const std::string &s)
47c07fba 313{
6ab3bc95
RP
314 int endpos;
315 return descape(s,0,endpos);
47c07fba
GE
316}
317
318std::string escape_shellarg(const std::string &input);
319
e93545dd 320#endif