Context Navigation

← Previous Revision
Latest Revision
Next Revision →
Normal
Revision Log

tz_db_base.hpp @ 857

Revision 857, 14.1 KB checked in by igarcia, 18 years ago (diff)

Rev	Line
[857]	1	#ifndef DATE_TIME_TZ_DB_BASE_HPP__
	2	#define DATE_TIME_TZ_DB_BASE_HPP__
	3
	4	/* Copyright (c) 2003-2004 CrystalClear Software, Inc.
	5	* Subject to the Boost Software License, Version 1.0.
	6	* (See accompanying file LICENSE-1.0 or http://www.boost.org/LICENSE-1.0)
	7	* Author: Jeff Garland, Bart Garst
	8	* $Date: 2005/05/07 08:49:15 $
	9	*/
	10
	11	#include "boost/shared_ptr.hpp"
	12	#include "boost/date_time/time_zone_names.hpp"
	13	#include "boost/date_time/time_zone_base.hpp"
	14	#include "boost/date_time/posix_time/posix_time.hpp"
	15	#include "boost/tokenizer.hpp"
	16	#include <string>
	17	#include <sstream>
	18	#include <map>
	19	#include <vector>
	20	#include <stdexcept>
	21	#include <fstream>
	22
	23	namespace boost {
	24	namespace date_time {
	25
	26
	27	struct data_not_accessible : public std::logic_error
	28	{
	29	data_not_accessible() : std::logic_error(std::string("Unable to locate or access the required datafile.")) {}
	30	data_not_accessible(const std::string& filespec) : std::logic_error(std::string("Unable to locate or access the required datafile. Filespec: " + filespec)) {}
	31	};
	32	struct bad_field_count : public std::out_of_range
	33	{
	34	bad_field_count(const std::string& s) : std::out_of_range(s) {}
	35	};
	36
	37	//! Creates a database of time_zones from csv datafile
	38	/*! The csv file containing the zone_specs used by the
	39	* tz_db_base is intended to be customized by the
	40	* library user. When customizing this file (or creating your own) the
	41	* file must follow a specific format.
	42	*
	43	* The first line is expected to contain column headings and is therefore
	44	* not processed by the tz_db_base.
	45	*
	46	* Each record (line) must have eleven fields. Some of those fields can
	47	* be empty. Every field (even empty ones) must be enclosed in
	48	* double-quotes.
	49	* Ex:
	50	* @code
	51	* "America/Phoenix" <- string enclosed in quotes
	52	* "" <- empty field
	53	* @endcode
	54	*
	55	* Some fields represent a length of time. The format of these fields
	56	* must be:
	57	* @code
	58	* "{+|-}hh:mm[:ss]" <- length-of-time format
	59	* @endcode
	60	* Where the plus or minus is mandatory and the seconds are optional.
	61	*
	62	* Since some time zones do not use daylight savings it is not always
	63	* necessary for every field in a zone_spec to contain a value. All
	64	* zone_specs must have at least ID and GMT offset. Zones that use
	65	* daylight savings must have all fields filled except:
	66	* STD ABBR, STD NAME, DST NAME. You should take note
	67	* that DST ABBR is mandatory for zones that use daylight savings
	68	* (see field descriptions for further details).
	69	*
	70	* ***** Fields and their description/details *******
	71	*
	72	* ID:
	73	* Contains the identifying string for the zone_spec. Any string will
	74	* do as long as it's unique. No two IDs can be the same.
	75	*
	76	* STD ABBR:
	77	* STD NAME:
	78	* DST ABBR:
	79	* DST NAME:
	80	* These four are all the names and abbreviations used by the time
	81	* zone being described. While any string will do in these fields,
	82	* care should be taken. These fields hold the strings that will be
	83	* used in the output of many of the local_time classes.
	84	* Ex:
	85	* @code
	86	* time_zone nyc = tz_db.time_zone_from_region("America/New_York");
	87	* local_time ny_time(date(2004, Aug, 30), IS_DST, nyc);
	88	* cout << ny_time.to_long_string() << endl;
	89	* // 2004-Aug-30 00:00:00 Eastern Daylight Time
	90	* cout << ny_time.to_short_string() << endl;
	91	* // 2004-Aug-30 00:00:00 EDT
	92	* @endcode
	93	*
	94	* NOTE: The exact format/function names may vary - see local_time
	95	* documentation for further details.
	96	*
	97	* GMT offset:
	98	* This is the number of hours added to utc to get the local time
	99	* before any daylight savings adjustments are made. Some examples
	100	* are: America/New_York offset -5 hours, & Africa/Cairo offset +2 hours.
	101	* The format must follow the length-of-time format described above.
	102	*
	103	* DST adjustment:
	104	* The amount of time added to gmt_offset when daylight savings is in
	105	* effect. The format must follow the length-of-time format described
	106	* above.
	107	*
	108	* DST Start Date rule:
	109	* This is a specially formatted string that describes the day of year
	110	* on which the transition takes place. It holds three fields of its own,
	111	* separated by semicolons.
	112	* The first field indicates the "nth" weekday of the month. The possible
	113	* values are: 1 (first), 2 (second), 3 (third), 4 (fourth), 5 (fifth),
	114	* and -1 (last).
	115	* The second field indicates the day-of-week from 0-6 (Sun=0).
	116	* The third field indicates the month from 1-12 (Jan=1).
	117	*
	118	* Examples are: "-1;5;9"="Last Friday of September",
	119	* "2;1;3"="Second Monday of March"
	120	*
	121	* Start time:
	122	* Start time is the number of hours past midnight, on the day of the
	123	* start transition, at which the transition takes place. More simply put, the
	124	* time of day the transition is made (in 24 hours format). The format
	125	* must follow the length-of-time format described above with the
	126	* exception that it must always be positive.
	127	*
	128	* DST End date rule:
	129	* See DST Start date rule. The difference here is this is the day
	130	* daylight savings ends (transition to STD).
	131	*
	132	* End time:
	133	* Same as Start time.
	134	*/
	135	template<class time_zone_type, class rule_type>
	136	class tz_db_base {
	137	public:
	138	/* Having charT as a template parameter created problems
	139	* with posix_time::duration_from_string. Templatizing
	140	* duration_from_string was not possible at this time, however,
	141	* it should be possible in the future (when poor compilers get
	142	* fixed or stop being used).
	143	* Since this class was designed to use charT as a parameter it
	144	* is simply typedef'd here to ease converting in back to a
	145	* parameter the future */
	146	typedef char charT;
	147
	148	typedef typename time_zone_type::base_type time_zone_base_type;
	149	typedef typename time_zone_type::time_duration_type time_duration_type;
	150	typedef time_zone_names_base<charT> time_zone_names;
	151	typedef dst_adjustment_offsets<time_duration_type> dst_adjustment_offsets;
	152	typedef std::basic_string<charT> string_type;
	153
	154	//! Constructs an empty database
	155	tz_db_base() {}
	156
	157	//! Process csv data file, may throw exceptions
	158	/! May throw data_not_accessible, or bad_field_count exceptions /
	159	void load_from_file(const std::string& pathspec)
	160	{
	161	string_type in_str;
	162	std::string buff;
	163
	164	std::ifstream ifs(pathspec.c_str());
	165	if(!ifs){
	166	throw data_not_accessible(pathspec);
	167	}
	168	std::getline(ifs, buff); // first line is column headings
	169
	170	while( std::getline(ifs, buff)) {
	171	parse_string(buff);
	172	}
	173	}
	174
	175	//! returns true if record successfully added to map
	176	/*! Takes an id string in the form of "America/Phoenix", and a
	177	* time_zone object for that region. The id string must be a unique
	178	* name that does not already exist in the database. */
	179	bool add_record(const string_type& id,
	180	boost::shared_ptr<time_zone_base_type> tz)
	181	{
	182	typename map_type::value_type p(id, tz);
	183	return (m_zone_map.insert(p)).second;
	184	}
	185
	186	//! Returns a time_zone object built from the specs for the given region
	187	/*! Returns a time_zone object built from the specs for the given
	188	* region. If region does not exist a local_time::record_not_found
	189	* exception will be thrown */
	190	boost::shared_ptr<time_zone_base_type>
	191	time_zone_from_region(const string_type& region) const
	192	{
	193	// get the record
	194	typename map_type::const_iterator record = m_zone_map.find(region);
	195	if(record == m_zone_map.end()){
	196	return boost::shared_ptr<time_zone_base_type>(); //null pointer
	197	}
	198	return record->second;
	199	}
	200
	201	//! Returns a vector of strings holding the time zone regions in the database
	202	std::vector<std::string> region_list() const
	203	{
	204	typedef std::vector<std::string> vector_type;
	205	vector_type regions;
	206	typename map_type::const_iterator itr = m_zone_map.begin();
	207	while(itr != m_zone_map.end()) {
	208	regions.push_back(itr->first);
	209	++itr;
	210	}
	211	return regions;
	212	}
	213
	214	private:
	215	typedef std::map<string_type, boost::shared_ptr<time_zone_base_type> > map_type;
	216	map_type m_zone_map;
	217
	218	// start and end rule are of the same type
	219	typedef typename rule_type::start_rule::week_num week_num;
	220
	221	/* TODO: mechanisms need to be put in place to handle different
	222	* types of rule specs. parse_rules() only handles nth_kday
	223	* rule types. */
	224
	225	//! parses rule specs for transition day rules
	226	rule_type* parse_rules(const string_type& sr, const string_type& er) const
	227	{
	228	using namespace gregorian;
	229	// start and end rule are of the same type,
	230	// both are included here for readability
	231	typedef typename rule_type::start_rule start_rule;
	232	typedef typename rule_type::end_rule end_rule;
	233
	234	// these are: [start\|end] nth, day, month
	235	int s_nth = 0, s_d = 0, s_m = 0;
	236	int e_nth = 0, e_d = 0, e_m = 0;
	237	split_rule_spec(s_nth, s_d, s_m, sr);
	238	split_rule_spec(e_nth, e_d, e_m, er);
	239
	240	typename start_rule::week_num s_wn, e_wn;
	241	s_wn = get_week_num(s_nth);
	242	e_wn = get_week_num(e_nth);
	243
	244
	245	return new rule_type(start_rule(s_wn, s_d, s_m),
	246	end_rule(e_wn, e_d, e_m));
	247	}
	248	//! helper function for parse_rules()
	249	week_num get_week_num(int nth) const
	250	{
	251	typedef typename rule_type::start_rule start_rule;
	252	switch(nth){
	253	case 1:
	254	return start_rule::first;
	255	case 2:
	256	return start_rule::second;
	257	case 3:
	258	return start_rule::third;
	259	case 4:
	260	return start_rule::fourth;
	261	case 5:
	262	case -1:
	263	return start_rule::fifth;
	264	default:
	265	// shouldn't get here - add error handling later
	266	break;
	267	}
	268	return start_rule::fifth; // silence warnings
	269	}
	270
	271	//! splits the [start\|end]_date_rule string into 3 ints
	272	void split_rule_spec(int& nth, int& d, int& m, string_type rule) const
	273	{
	274	typedef boost::tokenizer<boost::char_separator<charT>,
	275	string_type::const_iterator,
	276	string_type > tokenizer;
	277	const charT sep_char[] = { ';', '\0'};
	278	boost::char_separator<charT> sep(sep_char);
	279	tokenizer tokens(rule, sep); // 3 fields
	280
	281	typename tokenizer::iterator tok_iter = tokens.begin();
	282	nth = std::atoi(tok_iter->c_str()); ++tok_iter;
	283	d = std::atoi(tok_iter->c_str()); ++tok_iter;
	284	m = std::atoi(tok_iter->c_str());
	285	}
	286
	287
	288	//! Take a line from the csv, turn it into a time_zone_type.
	289	/*! Take a line from the csv, turn it into a time_zone_type,
	290	* and add it to the map. Zone_specs in csv file are expected to
	291	* have eleven fields that describe the time zone. Returns true if
	292	* zone_spec successfully added to database */
	293	bool parse_string(string_type& s)
	294	{
	295
	296	std::vector<string_type> result;
	297	typedef boost::token_iterator_generator<boost::escaped_list_separator<charT>, string_type::const_iterator, string_type >::type token_iter_type;
	298
	299	token_iter_type i = boost::make_token_iterator<string_type>(s.begin(), s.end(),boost::escaped_list_separator<charT>());
	300
	301	token_iter_type end;
	302	while (i != end) {
	303	result.push_back(*i);
	304	i++;
	305	}
	306
	307	enum db_fields { ID, STDABBR, STDNAME, DSTABBR, DSTNAME, GMTOFFSET,
	308	DSTADJUST, START_DATE_RULE, START_TIME, END_DATE_RULE,
	309	END_TIME, FIELD_COUNT };
	310
	311	//take a shot at fixing gcc 4.x error
	312	const unsigned int expected_fields = static_cast<unsigned int>(FIELD_COUNT);
	313	if (result.size() != expected_fields) {
	314	std::stringstream msg;
	315	msg << "Expecting " << FIELD_COUNT << " fields, got "
	316	<< result.size() << " fields in line: " << s;
	317	throw bad_field_count(msg.str());
	318	}
	319
	320	// initializations
	321	bool has_dst = true;
	322	if(result[DSTABBR] == std::string()){
	323	has_dst = false;
	324	}
	325
	326
	327	// start building components of a time_zone
	328	time_zone_names names(result[STDNAME], result[STDABBR],
	329	result[DSTNAME], result[DSTABBR]);
	330
	331	time_duration_type utc_offset =
	332	posix_time::duration_from_string(result[GMTOFFSET]);
	333
	334	dst_adjustment_offsets adjust(time_duration_type(0,0,0),
	335	time_duration_type(0,0,0),
	336	time_duration_type(0,0,0));
	337
	338	boost::shared_ptr<rule_type> rules;
	339
	340	if(has_dst){
	341	adjust = dst_adjustment_offsets(
	342	posix_time::duration_from_string(result[DSTADJUST]),
	343	posix_time::duration_from_string(result[START_TIME]),
	344	posix_time::duration_from_string(result[END_TIME])
	345	);
	346
	347	rules =
	348	boost::shared_ptr<rule_type>(parse_rules(result[START_DATE_RULE],
	349	result[END_DATE_RULE]));
	350	}
	351	string_type id(result[ID]);
	352	boost::shared_ptr<time_zone_base_type> zone(new time_zone_type(names, utc_offset, adjust, rules));
	353	return (add_record(id, zone));
	354
	355	}
	356
	357	};
	358
	359	} } // namespace
	360
	361	#endif // DATE_TIME_TZ_DB_BASE_HPP__

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: NonGTP/Boost/boost/date_time/tz_db_base.hpp @ 857

Download in other formats: