1 | #ifndef _DATE_TIME_TIME_PARSING_HPP___ |
---|
2 | #define _DATE_TIME_TIME_PARSING_HPP___ |
---|
3 | |
---|
4 | /* Copyright (c) 2002,2003,2005 CrystalClear Software, Inc. |
---|
5 | * Use, modification and distribution is subject to the |
---|
6 | * Boost Software License, Version 1.0. (See accompanying |
---|
7 | * file LICENSE-1.0 or http://www.boost.org/LICENSE-1.0) |
---|
8 | * Author: Jeff Garland, Bart Garst |
---|
9 | * $Date: 2005/10/23 20:15:06 $ |
---|
10 | */ |
---|
11 | |
---|
12 | #include "boost/tokenizer.hpp" |
---|
13 | #include "boost/lexical_cast.hpp" |
---|
14 | #include "boost/date_time/date_parsing.hpp" |
---|
15 | #include "boost/cstdint.hpp" |
---|
16 | #include <iostream> |
---|
17 | |
---|
18 | namespace boost { |
---|
19 | namespace date_time { |
---|
20 | |
---|
21 | //! computes exponential math like 2^8 => 256, only works with positive integers |
---|
22 | //Not general purpose, but needed b/c std::pow is not available |
---|
23 | //everywehere. Hasn't been tested with negatives and zeros |
---|
24 | template<class int_type> |
---|
25 | inline |
---|
26 | int_type power(int_type base, int_type exponent) |
---|
27 | { |
---|
28 | int_type result = 1; |
---|
29 | for(int i = 0; i < exponent; ++i){ |
---|
30 | result *= base; |
---|
31 | } |
---|
32 | return result; |
---|
33 | } |
---|
34 | |
---|
35 | //! Creates a time_duration object from a delimited string |
---|
36 | /*! Expected format for string is "[-]h[h][:mm][:ss][.fff]". |
---|
37 | * If the number of fractional digits provided is greater than the |
---|
38 | * precision of the time duration type then the extra digits are |
---|
39 | * truncated. |
---|
40 | * |
---|
41 | * A negative duration will be created if the first character in |
---|
42 | * string is a '-', all other '-' will be treated as delimiters. |
---|
43 | * Accepted delimiters are "-:,.". |
---|
44 | */ |
---|
45 | template<class time_duration, class char_type> |
---|
46 | inline |
---|
47 | time_duration |
---|
48 | str_from_delimited_time_duration(const std::basic_string<char_type>& s) |
---|
49 | { |
---|
50 | unsigned short min=0, sec =0; |
---|
51 | int hour =0; |
---|
52 | bool is_neg = (s.at(0) == '-'); |
---|
53 | boost::int64_t fs=0; |
---|
54 | int pos = 0; |
---|
55 | |
---|
56 | typedef typename std::basic_string<char_type>::traits_type traits_type; |
---|
57 | typedef boost::char_separator<char_type, traits_type> char_separator_type; |
---|
58 | typedef boost::tokenizer<char_separator_type, |
---|
59 | typename std::basic_string<char_type>::const_iterator, |
---|
60 | std::basic_string<char_type> > tokenizer; |
---|
61 | typedef typename boost::tokenizer<char_separator_type, |
---|
62 | typename std::basic_string<char_type>::const_iterator, |
---|
63 | typename std::basic_string<char_type> >::iterator tokenizer_iterator; |
---|
64 | |
---|
65 | char_type sep_chars[5] = {'-',':',',','.'}; |
---|
66 | char_separator_type sep(sep_chars); |
---|
67 | tokenizer tok(s,sep); |
---|
68 | for(tokenizer_iterator beg=tok.begin(); beg!=tok.end();++beg){ |
---|
69 | switch(pos) { |
---|
70 | case 0: { |
---|
71 | hour = boost::lexical_cast<int>(*beg); |
---|
72 | break; |
---|
73 | } |
---|
74 | case 1: { |
---|
75 | min = boost::lexical_cast<unsigned short>(*beg); |
---|
76 | break; |
---|
77 | } |
---|
78 | case 2: { |
---|
79 | sec = boost::lexical_cast<unsigned short>(*beg); |
---|
80 | break; |
---|
81 | }; |
---|
82 | case 3: { |
---|
83 | int digits = static_cast<int>(beg->length()); |
---|
84 | //Works around a bug in MSVC 6 library that does not support |
---|
85 | //operator>> thus meaning lexical_cast will fail to compile. |
---|
86 | #if (defined(BOOST_MSVC) && (_MSC_VER < 1300)) |
---|
87 | // msvc wouldn't compile 'time_duration::num_fractional_digits()' |
---|
88 | // (required template argument list) as a workaround a temp |
---|
89 | // time_duration object was used |
---|
90 | time_duration td(hour,min,sec,fs); |
---|
91 | int precision = td.num_fractional_digits(); |
---|
92 | // _atoi64 is an MS specific function |
---|
93 | if(digits >= precision) { |
---|
94 | // drop excess digits |
---|
95 | fs = _atoi64(beg->substr(0, precision).c_str()); |
---|
96 | } |
---|
97 | else { |
---|
98 | fs = _atoi64(beg->c_str()); |
---|
99 | } |
---|
100 | #else |
---|
101 | int precision = time_duration::num_fractional_digits(); |
---|
102 | if(digits >= precision) { |
---|
103 | // drop excess digits |
---|
104 | fs = boost::lexical_cast<boost::int64_t>(beg->substr(0, precision)); |
---|
105 | } |
---|
106 | else { |
---|
107 | fs = boost::lexical_cast<boost::int64_t>(*beg); |
---|
108 | } |
---|
109 | #endif |
---|
110 | if(digits < precision){ |
---|
111 | // trailing zeros get dropped from the string, |
---|
112 | // "1:01:01.1" would yield .000001 instead of .100000 |
---|
113 | // the power() compensates for the missing decimal places |
---|
114 | fs *= power(10, precision - digits); |
---|
115 | } |
---|
116 | |
---|
117 | break; |
---|
118 | } |
---|
119 | }//switch |
---|
120 | pos++; |
---|
121 | } |
---|
122 | if(is_neg) { |
---|
123 | return -time_duration(hour, min, sec, fs); |
---|
124 | } |
---|
125 | else { |
---|
126 | return time_duration(hour, min, sec, fs); |
---|
127 | } |
---|
128 | } |
---|
129 | |
---|
130 | //! Creates a time_duration object from a delimited string |
---|
131 | /*! Expected format for string is "[-]h[h][:mm][:ss][.fff]". |
---|
132 | * If the number of fractional digits provided is greater than the |
---|
133 | * precision of the time duration type then the extra digits are |
---|
134 | * truncated. |
---|
135 | * |
---|
136 | * A negative duration will be created if the first character in |
---|
137 | * string is a '-', all other '-' will be treated as delimiters. |
---|
138 | * Accepted delimiters are "-:,.". |
---|
139 | */ |
---|
140 | template<class time_duration> |
---|
141 | inline |
---|
142 | time_duration |
---|
143 | parse_delimited_time_duration(const std::string& s) |
---|
144 | { |
---|
145 | return str_from_delimited_time_duration<time_duration,char>(s); |
---|
146 | } |
---|
147 | |
---|
148 | //! Utility function to split appart string |
---|
149 | inline |
---|
150 | bool |
---|
151 | split(const std::string& s, |
---|
152 | char sep, |
---|
153 | std::string& first, |
---|
154 | std::string& second) |
---|
155 | { |
---|
156 | int sep_pos = static_cast<int>(s.find(sep)); |
---|
157 | first = s.substr(0,sep_pos); |
---|
158 | second = s.substr(sep_pos+1); |
---|
159 | return true; |
---|
160 | } |
---|
161 | |
---|
162 | |
---|
163 | template<class time_type> |
---|
164 | inline |
---|
165 | time_type |
---|
166 | parse_delimited_time(const std::string& s, char sep) |
---|
167 | { |
---|
168 | typedef typename time_type::time_duration_type time_duration; |
---|
169 | typedef typename time_type::date_type date_type; |
---|
170 | |
---|
171 | //split date/time on a unique delimiter char such as ' ' or 'T' |
---|
172 | std::string date_string, tod_string; |
---|
173 | split(s, sep, date_string, tod_string); |
---|
174 | //call parse_date with first string |
---|
175 | date_type d = parse_date<date_type>(date_string); |
---|
176 | //call parse_time_duration with remaining string |
---|
177 | time_duration td = parse_delimited_time_duration<time_duration>(tod_string); |
---|
178 | //construct a time |
---|
179 | return time_type(d, td); |
---|
180 | |
---|
181 | } |
---|
182 | |
---|
183 | //! Parse time duration part of an iso time of form: [-]hhmmss[.fff...] (eg: 120259.123 is 12 hours, 2 min, 59 seconds, 123000 microseconds) |
---|
184 | template<class time_duration> |
---|
185 | inline |
---|
186 | time_duration |
---|
187 | parse_undelimited_time_duration(const std::string& s) |
---|
188 | { |
---|
189 | int precision = 0; |
---|
190 | { |
---|
191 | // msvc wouldn't compile 'time_duration::num_fractional_digits()' |
---|
192 | // (required template argument list) as a workaround, a temp |
---|
193 | // time_duration object was used |
---|
194 | time_duration tmp(0,0,0,1); |
---|
195 | precision = tmp.num_fractional_digits(); |
---|
196 | } |
---|
197 | // 'precision+1' is so we grab all digits, plus the decimal |
---|
198 | int offsets[] = {2,2,2, precision+1}; |
---|
199 | int pos = 0, sign = 0; |
---|
200 | int hours = 0; |
---|
201 | short min=0, sec=0; |
---|
202 | boost::int64_t fs=0; |
---|
203 | // increment one position if the string was "signed" |
---|
204 | if(s.at(sign) == '-') |
---|
205 | { |
---|
206 | ++sign; |
---|
207 | } |
---|
208 | // stlport choked when passing s.substr() to tokenizer |
---|
209 | // using a new string fixed the error |
---|
210 | std::string remain = s.substr(sign); |
---|
211 | /* We do not want the offset_separator to wrap the offsets, we |
---|
212 | * will never want to process more than: |
---|
213 | * 2 char, 2 char, 2 char, frac_sec length. |
---|
214 | * We *do* want the offset_separator to give us a partial for the |
---|
215 | * last characters if there were not enough provided in the input string. */ |
---|
216 | bool wrap_off = false; |
---|
217 | bool ret_part = true; |
---|
218 | boost::offset_separator osf(offsets, offsets+4, wrap_off, ret_part); |
---|
219 | typedef boost::tokenizer<boost::offset_separator, |
---|
220 | std::basic_string<char>::const_iterator, |
---|
221 | std::basic_string<char> > tokenizer; |
---|
222 | typedef boost::tokenizer<boost::offset_separator, |
---|
223 | std::basic_string<char>::const_iterator, |
---|
224 | std::basic_string<char> >::iterator tokenizer_iterator; |
---|
225 | tokenizer tok(remain, osf); |
---|
226 | for(tokenizer_iterator ti=tok.begin(); ti!=tok.end();++ti){ |
---|
227 | switch(pos) { |
---|
228 | case 0: |
---|
229 | { |
---|
230 | hours = boost::lexical_cast<int>(*ti); |
---|
231 | break; |
---|
232 | } |
---|
233 | case 1: |
---|
234 | { |
---|
235 | min = boost::lexical_cast<short>(*ti); |
---|
236 | break; |
---|
237 | } |
---|
238 | case 2: |
---|
239 | { |
---|
240 | sec = boost::lexical_cast<short>(*ti); |
---|
241 | break; |
---|
242 | } |
---|
243 | case 3: |
---|
244 | { |
---|
245 | std::string char_digits(ti->substr(1)); // digits w/no decimal |
---|
246 | int digits = static_cast<int>(char_digits.length()); |
---|
247 | |
---|
248 | //Works around a bug in MSVC 6 library that does not support |
---|
249 | //operator>> thus meaning lexical_cast will fail to compile. |
---|
250 | #if (defined(BOOST_MSVC) && (_MSC_VER <= 1200)) // 1200 == VC++ 6.0 |
---|
251 | // _atoi64 is an MS specific function |
---|
252 | if(digits >= precision) { |
---|
253 | // drop excess digits |
---|
254 | fs = _atoi64(char_digits.substr(0, precision).c_str()); |
---|
255 | } |
---|
256 | else if(digits == 0) { |
---|
257 | fs = 0; // just in case _atoi64 doesn't like an empty string |
---|
258 | } |
---|
259 | else { |
---|
260 | fs = _atoi64(char_digits.c_str()); |
---|
261 | } |
---|
262 | #else |
---|
263 | if(digits >= precision) { |
---|
264 | // drop excess digits |
---|
265 | fs = boost::lexical_cast<boost::int64_t>(char_digits.substr(0, precision)); |
---|
266 | } |
---|
267 | else if(digits == 0) { |
---|
268 | fs = 0; // lexical_cast doesn't like empty strings |
---|
269 | } |
---|
270 | else { |
---|
271 | fs = boost::lexical_cast<boost::int64_t>(char_digits); |
---|
272 | } |
---|
273 | #endif |
---|
274 | if(digits < precision){ |
---|
275 | // trailing zeros get dropped from the string, |
---|
276 | // "1:01:01.1" would yield .000001 instead of .100000 |
---|
277 | // the power() compensates for the missing decimal places |
---|
278 | fs *= power(10, precision - digits); |
---|
279 | } |
---|
280 | |
---|
281 | break; |
---|
282 | } |
---|
283 | }; |
---|
284 | pos++; |
---|
285 | } |
---|
286 | if(sign) { |
---|
287 | return -time_duration(hours, min, sec, fs); |
---|
288 | } |
---|
289 | else { |
---|
290 | return time_duration(hours, min, sec, fs); |
---|
291 | } |
---|
292 | } |
---|
293 | |
---|
294 | //! Parse time string of form YYYYMMDDThhmmss where T is delimeter between date and time |
---|
295 | template<class time_type> |
---|
296 | inline |
---|
297 | time_type |
---|
298 | parse_iso_time(const std::string& s, char sep) |
---|
299 | { |
---|
300 | typedef typename time_type::time_duration_type time_duration; |
---|
301 | typedef typename time_type::date_type date_type; |
---|
302 | |
---|
303 | //split date/time on a unique delimiter char such as ' ' or 'T' |
---|
304 | std::string date_string, tod_string; |
---|
305 | split(s, sep, date_string, tod_string); |
---|
306 | //call parse_date with first string |
---|
307 | date_type d = parse_undelimited_date<date_type>(date_string); |
---|
308 | //call parse_time_duration with remaining string |
---|
309 | time_duration td = parse_undelimited_time_duration<time_duration>(tod_string); |
---|
310 | //construct a time |
---|
311 | return time_type(d, td); |
---|
312 | } |
---|
313 | |
---|
314 | |
---|
315 | |
---|
316 | } }//namespace date_time |
---|
317 | |
---|
318 | |
---|
319 | |
---|
320 | |
---|
321 | #endif |
---|