// time_parsing.hpp
  1. #ifndef _DATE_TIME_TIME_PARSING_HPP___
  2. #define _DATE_TIME_TIME_PARSING_HPP___
  3. /* Copyright (c) 2002,2003,2005 CrystalClear Software, Inc.
  4. * Use, modification and distribution is subject to the
  5. * Boost Software License, Version 1.0. (See accompanying
  6. * file LICENSE_1_0.txt or http://www.boost.org/LICENSE_1_0.txt)
  7. * Author: Jeff Garland, Bart Garst
  8. * $Date$
  9. */
  10. #include "boost/tokenizer.hpp"
  11. #include "boost/lexical_cast.hpp"
  12. #include "boost/date_time/date_parsing.hpp"
  13. #include "boost/cstdint.hpp"
  14. #include <iostream>
  15. namespace boost {
  16. namespace date_time {
  //! Computes integer exponentiation by repeated multiplication, e.g. power(2, 8) => 256
  /*! Not general purpose, but needed because std::pow is not available
   * everywhere.
   *
   * \param base     value to be multiplied
   * \param exponent number of times base is multiplied into the result
   * \return base raised to exponent; 1 when exponent is zero or negative
   *
   * No overflow checking is performed on the result.
   */
  template<class int_type>
  inline
  int_type power(int_type base, int_type exponent)
  {
    int_type result = 1;
    // The counter has the same type as the exponent so that wide exponents
    // are not truncated to int and unsigned exponents are not compared
    // against a signed counter.
    for(int_type i = 0; i < exponent; ++i){
      result *= base;
    }
    return result;
  }
  30. //! Creates a time_duration object from a delimited string
  31. /*! Expected format for string is "[-]h[h][:mm][:ss][.fff]".
  32. * If the number of fractional digits provided is greater than the
  33. * precision of the time duration type then the extra digits are
  34. * truncated.
  35. *
  36. * A negative duration will be created if the first character in
  37. * string is a '-', all other '-' will be treated as delimiters.
  38. * Accepted delimiters are "-:,.".
  39. */
  40. template<class time_duration, class char_type>
  41. inline
  42. time_duration
  43. str_from_delimited_time_duration(const std::basic_string<char_type>& s)
  44. {
  45. unsigned short min=0, sec =0;
  46. int hour =0;
  47. bool is_neg = (s.at(0) == '-');
  48. boost::int64_t fs=0;
  49. int pos = 0;
  50. typedef typename std::basic_string<char_type>::traits_type traits_type;
  51. typedef boost::char_separator<char_type, traits_type> char_separator_type;
  52. typedef boost::tokenizer<char_separator_type,
  53. typename std::basic_string<char_type>::const_iterator,
  54. std::basic_string<char_type> > tokenizer;
  55. typedef typename boost::tokenizer<char_separator_type,
  56. typename std::basic_string<char_type>::const_iterator,
  57. typename std::basic_string<char_type> >::iterator tokenizer_iterator;
  58. char_type sep_chars[5] = {'-',':',',','.'};
  59. char_separator_type sep(sep_chars);
  60. tokenizer tok(s,sep);
  61. for(tokenizer_iterator beg=tok.begin(); beg!=tok.end();++beg){
  62. switch(pos) {
  63. case 0: {
  64. hour = boost::lexical_cast<int>(*beg);
  65. break;
  66. }
  67. case 1: {
  68. min = boost::lexical_cast<unsigned short>(*beg);
  69. break;
  70. }
  71. case 2: {
  72. sec = boost::lexical_cast<unsigned short>(*beg);
  73. break;
  74. };
  75. case 3: {
  76. int digits = static_cast<int>(beg->length());
  77. //Works around a bug in MSVC 6 library that does not support
  78. //operator>> thus meaning lexical_cast will fail to compile.
  79. #if (defined(BOOST_MSVC) && (_MSC_VER < 1300))
  80. // msvc wouldn't compile 'time_duration::num_fractional_digits()'
  81. // (required template argument list) as a workaround a temp
  82. // time_duration object was used
  83. time_duration td(hour,min,sec,fs);
  84. int precision = td.num_fractional_digits();
  85. // _atoi64 is an MS specific function
  86. if(digits >= precision) {
  87. // drop excess digits
  88. fs = _atoi64(beg->substr(0, precision).c_str());
  89. }
  90. else {
  91. fs = _atoi64(beg->c_str());
  92. }
  93. #else
  94. int precision = time_duration::num_fractional_digits();
  95. if(digits >= precision) {
  96. // drop excess digits
  97. fs = boost::lexical_cast<boost::int64_t>(beg->substr(0, precision));
  98. }
  99. else {
  100. fs = boost::lexical_cast<boost::int64_t>(*beg);
  101. }
  102. #endif
  103. if(digits < precision){
  104. // trailing zeros get dropped from the string,
  105. // "1:01:01.1" would yield .000001 instead of .100000
  106. // the power() compensates for the missing decimal places
  107. fs *= power(10, precision - digits);
  108. }
  109. break;
  110. }
  111. default: break;
  112. }//switch
  113. pos++;
  114. }
  115. if(is_neg) {
  116. return -time_duration(hour, min, sec, fs);
  117. }
  118. else {
  119. return time_duration(hour, min, sec, fs);
  120. }
  121. }
  122. //! Creates a time_duration object from a delimited string
  123. /*! Expected format for string is "[-]h[h][:mm][:ss][.fff]".
  124. * If the number of fractional digits provided is greater than the
  125. * precision of the time duration type then the extra digits are
  126. * truncated.
  127. *
  128. * A negative duration will be created if the first character in
  129. * string is a '-', all other '-' will be treated as delimiters.
  130. * Accepted delimiters are "-:,.".
  131. */
  132. template<class time_duration>
  133. inline
  134. time_duration
  135. parse_delimited_time_duration(const std::string& s)
  136. {
  137. return str_from_delimited_time_duration<time_duration,char>(s);
  138. }
  //! Utility function to split a string apart at the first occurrence of sep
  /*! \param s      string to split
   *  \param sep    separator character; it is not included in either part
   *  \param first  receives everything before the first sep, or all of s
   *                when sep does not occur
   *  \param second receives everything after the first sep, or is cleared
   *                when sep does not occur
   *  \return always true; the return value does not report whether sep
   *          was found
   */
  inline
  bool
  split(const std::string& s,
        char sep,
        std::string& first,
        std::string& second)
  {
    const std::string::size_type sep_pos = s.find(sep);
    // substr(0, npos) yields the whole string when sep is absent
    first = s.substr(0, sep_pos);
    if (sep_pos != std::string::npos) {
      second = s.substr(sep_pos + 1);
    }
    else {
      // do not leave whatever the caller had in second behind
      second.clear();
    }
    return true;
  }
  153. template<class time_type>
  154. inline
  155. time_type
  156. parse_delimited_time(const std::string& s, char sep)
  157. {
  158. typedef typename time_type::time_duration_type time_duration;
  159. typedef typename time_type::date_type date_type;
  160. //split date/time on a unique delimiter char such as ' ' or 'T'
  161. std::string date_string, tod_string;
  162. split(s, sep, date_string, tod_string);
  163. //call parse_date with first string
  164. date_type d = parse_date<date_type>(date_string);
  165. //call parse_time_duration with remaining string
  166. time_duration td = parse_delimited_time_duration<time_duration>(tod_string);
  167. //construct a time
  168. return time_type(d, td);
  169. }
  170. //! Parse time duration part of an iso time of form: [-]hhmmss[.fff...] (eg: 120259.123 is 12 hours, 2 min, 59 seconds, 123000 microseconds)
  171. template<class time_duration>
  172. inline
  173. time_duration
  174. parse_undelimited_time_duration(const std::string& s)
  175. {
  176. int precision = 0;
  177. {
  178. // msvc wouldn't compile 'time_duration::num_fractional_digits()'
  179. // (required template argument list) as a workaround, a temp
  180. // time_duration object was used
  181. time_duration tmp(0,0,0,1);
  182. precision = tmp.num_fractional_digits();
  183. }
  184. // 'precision+1' is so we grab all digits, plus the decimal
  185. int offsets[] = {2,2,2, precision+1};
  186. int pos = 0, sign = 0;
  187. int hours = 0;
  188. short min=0, sec=0;
  189. boost::int64_t fs=0;
  190. // increment one position if the string was "signed"
  191. if(s.at(sign) == '-')
  192. {
  193. ++sign;
  194. }
  195. // stlport choked when passing s.substr() to tokenizer
  196. // using a new string fixed the error
  197. std::string remain = s.substr(sign);
  198. /* We do not want the offset_separator to wrap the offsets, we
  199. * will never want to process more than:
  200. * 2 char, 2 char, 2 char, frac_sec length.
  201. * We *do* want the offset_separator to give us a partial for the
  202. * last characters if there were not enough provided in the input string. */
  203. bool wrap_off = false;
  204. bool ret_part = true;
  205. boost::offset_separator osf(offsets, offsets+4, wrap_off, ret_part);
  206. typedef boost::tokenizer<boost::offset_separator,
  207. std::basic_string<char>::const_iterator,
  208. std::basic_string<char> > tokenizer;
  209. typedef boost::tokenizer<boost::offset_separator,
  210. std::basic_string<char>::const_iterator,
  211. std::basic_string<char> >::iterator tokenizer_iterator;
  212. tokenizer tok(remain, osf);
  213. for(tokenizer_iterator ti=tok.begin(); ti!=tok.end();++ti){
  214. switch(pos) {
  215. case 0:
  216. {
  217. hours = boost::lexical_cast<int>(*ti);
  218. break;
  219. }
  220. case 1:
  221. {
  222. min = boost::lexical_cast<short>(*ti);
  223. break;
  224. }
  225. case 2:
  226. {
  227. sec = boost::lexical_cast<short>(*ti);
  228. break;
  229. }
  230. case 3:
  231. {
  232. std::string char_digits(ti->substr(1)); // digits w/no decimal
  233. int digits = static_cast<int>(char_digits.length());
  234. //Works around a bug in MSVC 6 library that does not support
  235. //operator>> thus meaning lexical_cast will fail to compile.
  236. #if (defined(BOOST_MSVC) && (_MSC_VER <= 1200)) // 1200 == VC++ 6.0
  237. // _atoi64 is an MS specific function
  238. if(digits >= precision) {
  239. // drop excess digits
  240. fs = _atoi64(char_digits.substr(0, precision).c_str());
  241. }
  242. else if(digits == 0) {
  243. fs = 0; // just in case _atoi64 doesn't like an empty string
  244. }
  245. else {
  246. fs = _atoi64(char_digits.c_str());
  247. }
  248. #else
  249. if(digits >= precision) {
  250. // drop excess digits
  251. fs = boost::lexical_cast<boost::int64_t>(char_digits.substr(0, precision));
  252. }
  253. else if(digits == 0) {
  254. fs = 0; // lexical_cast doesn't like empty strings
  255. }
  256. else {
  257. fs = boost::lexical_cast<boost::int64_t>(char_digits);
  258. }
  259. #endif
  260. if(digits < precision){
  261. // trailing zeros get dropped from the string,
  262. // "1:01:01.1" would yield .000001 instead of .100000
  263. // the power() compensates for the missing decimal places
  264. fs *= power(10, precision - digits);
  265. }
  266. break;
  267. }
  268. default: break;
  269. };
  270. pos++;
  271. }
  272. if(sign) {
  273. return -time_duration(hours, min, sec, fs);
  274. }
  275. else {
  276. return time_duration(hours, min, sec, fs);
  277. }
  278. }
  279. //! Parse time string of form YYYYMMDDThhmmss where T is delimeter between date and time
  280. template<class time_type>
  281. inline
  282. time_type
  283. parse_iso_time(const std::string& s, char sep)
  284. {
  285. typedef typename time_type::time_duration_type time_duration;
  286. typedef typename time_type::date_type date_type;
  287. //split date/time on a unique delimiter char such as ' ' or 'T'
  288. std::string date_string, tod_string;
  289. split(s, sep, date_string, tod_string);
  290. //call parse_date with first string
  291. date_type d = parse_undelimited_date<date_type>(date_string);
  292. //call parse_time_duration with remaining string
  293. time_duration td = parse_undelimited_time_duration<time_duration>(tod_string);
  294. //construct a time
  295. return time_type(d, td);
  296. }
  297. } }//namespace date_time
  298. #endif