Chris@16: // ---------------------------------------------------------------------------- Chris@16: // parsing.hpp : implementation of the parsing member functions Chris@16: // ( parse, parse_printf_directive) Chris@16: // ---------------------------------------------------------------------------- Chris@16: Chris@16: // Copyright Samuel Krempp 2003. Use, modification, and distribution are Chris@16: // subject to the Boost Software License, Version 1.0. (See accompanying Chris@16: // file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt) Chris@16: Chris@16: // see http://www.boost.org/libs/format for library home page Chris@16: Chris@16: // ---------------------------------------------------------------------------- Chris@16: Chris@16: #ifndef BOOST_FORMAT_PARSING_HPP Chris@16: #define BOOST_FORMAT_PARSING_HPP Chris@16: Chris@16: Chris@16: #include Chris@16: #include Chris@16: #include Chris@16: #include Chris@16: Chris@16: Chris@16: namespace boost { Chris@16: namespace io { Chris@16: namespace detail { Chris@16: Chris@16: #if defined(BOOST_NO_STD_LOCALE) Chris@16: // streams will be used for narrow / widen. but these methods are not const Chris@16: template Chris@16: T& const_or_not(const T& x) { Chris@16: return const_cast (x); Chris@16: } Chris@16: #else Chris@16: template Chris@16: const T& const_or_not(const T& x) { Chris@16: return x; Chris@16: } Chris@16: #endif Chris@16: Chris@16: template inline Chris@16: char wrap_narrow(const Facet& fac, Ch c, char deflt) { Chris@16: return const_or_not(fac).narrow(c, deflt); Chris@16: } Chris@16: Chris@16: template inline Chris@16: bool wrap_isdigit(const Facet& fac, Ch c) { Chris@16: #if ! defined( BOOST_NO_LOCALE_ISDIGIT ) Chris@16: return fac.is(std::ctype::digit, c); Chris@16: # else Chris@16: (void) fac; // remove "unused parameter" warning Chris@16: using namespace std; Chris@16: return isdigit(c); Chris@16: #endif Chris@16: } Chris@16: Chris@16: template Chris@16: Iter wrap_scan_notdigit(const Facet & fac, Iter beg, Iter end) { Chris@16: using namespace std; Chris@16: for( ; beg!=end && wrap_isdigit(fac, *beg); ++beg) ; Chris@16: return beg; Chris@16: } Chris@16: Chris@16: Chris@16: // Input : [start, last) iterators range and a Chris@16: // a Facet to use its widen/narrow member function Chris@16: // Effects : read sequence and convert digits into integral n, of type Res Chris@16: // Returns : n Chris@16: template Chris@16: Iter str2int (const Iter & start, const Iter & last, Res & res, Chris@16: const Facet& fac) Chris@16: { Chris@16: using namespace std; Chris@16: Iter it; Chris@16: res=0; Chris@16: for(it=start; it != last && wrap_isdigit(fac, *it); ++it ) { Chris@16: char cur_ch = wrap_narrow(fac, *it, 0); // cant fail. Chris@16: res *= 10; Chris@16: res += cur_ch - '0'; // 22.2.1.1.2.13 of the C++ standard Chris@16: } Chris@16: return it; Chris@16: } Chris@16: Chris@16: // skip printf's "asterisk-fields" directives in the format-string buf Chris@16: // Input : char string, with starting index *pos_p Chris@16: // a Facet merely to use its widen/narrow member function Chris@16: // Effects : advance *pos_p by skipping printf's asterisk fields. Chris@16: // Returns : nothing Chris@16: template Chris@16: Iter skip_asterisk(Iter start, Iter last, const Facet& fac) Chris@16: { Chris@16: using namespace std; Chris@16: ++ start; Chris@16: start = wrap_scan_notdigit(fac, start, last); Chris@16: if(start!=last && *start== const_or_not(fac).widen( '$') ) Chris@16: ++start; Chris@16: return start; Chris@16: } Chris@16: Chris@16: Chris@16: // auxiliary func called by parse_printf_directive Chris@16: // for centralising error handling Chris@16: // it either throws if user sets the corresponding flag, or does nothing. Chris@16: inline void maybe_throw_exception(unsigned char exceptions, Chris@16: std::size_t pos, std::size_t size) Chris@16: { Chris@16: if(exceptions & io::bad_format_string_bit) Chris@16: boost::throw_exception(io::bad_format_string(pos, size) ); Chris@16: } Chris@16: Chris@16: Chris@16: // Input: the position of a printf-directive in the format-string Chris@16: // a basic_ios& merely to use its widen/narrow member function Chris@16: // a bitset'exceptions' telling whether to throw exceptions on errors. Chris@16: // Returns: Chris@16: // true if parse succeeded (ignore some errors if exceptions disabled) Chris@16: // false if it failed so bad that the directive should be printed verbatim Chris@16: // Effects: Chris@16: // start is incremented so that *start is the first char after Chris@16: // this directive Chris@16: // *fpar is set with the parameters read in the directive Chris@16: template Chris@16: bool parse_printf_directive(Iter & start, const Iter& last, Chris@16: detail::format_item * fpar, Chris@16: const Facet& fac, Chris@16: std::size_t offset, unsigned char exceptions) Chris@16: { Chris@16: typedef typename basic_format::format_item_t format_item_t; Chris@16: Chris@16: fpar->argN_ = format_item_t::argN_no_posit; // if no positional-directive Chris@16: bool precision_set = false; Chris@16: bool in_brackets=false; Chris@16: Iter start0 = start; Chris@16: std::size_t fstring_size = last-start0+offset; Chris@16: Chris@16: if(start>= last) { // empty directive : this is a trailing % Chris@16: maybe_throw_exception(exceptions, start-start0 + offset, fstring_size); Chris@16: return false; Chris@16: } Chris@16: Chris@16: if(*start== const_or_not(fac).widen( '|')) { Chris@16: in_brackets=true; Chris@16: if( ++start >= last ) { Chris@16: maybe_throw_exception(exceptions, start-start0 + offset, fstring_size); Chris@16: return false; Chris@16: } Chris@16: } Chris@16: Chris@16: // the flag '0' would be picked as a digit for argument order, but here it's a flag : Chris@16: if(*start== const_or_not(fac).widen( '0')) Chris@16: goto parse_flags; Chris@16: Chris@16: // handle argument order (%2$d) or possibly width specification: %2d Chris@16: if(wrap_isdigit(fac, *start)) { Chris@16: int n; Chris@16: start = str2int(start, last, n, fac); Chris@16: if( start >= last ) { Chris@16: maybe_throw_exception(exceptions, start-start0+offset, fstring_size); Chris@16: return false; Chris@16: } Chris@16: Chris@16: // %N% case : this is already the end of the directive Chris@16: if( *start == const_or_not(fac).widen( '%') ) { Chris@16: fpar->argN_ = n-1; Chris@16: ++start; Chris@16: if( in_brackets) Chris@16: maybe_throw_exception(exceptions, start-start0+offset, fstring_size); Chris@16: // but don't return. maybe "%" was used in lieu of '$', so we go on. Chris@16: else Chris@16: return true; Chris@16: } Chris@16: Chris@16: if ( *start== const_or_not(fac).widen( '$') ) { Chris@16: fpar->argN_ = n-1; Chris@16: ++start; Chris@16: } Chris@16: else { Chris@16: // non-positionnal directive Chris@16: fpar->fmtstate_.width_ = n; Chris@16: fpar->argN_ = format_item_t::argN_no_posit; Chris@16: goto parse_precision; Chris@16: } Chris@16: } Chris@16: Chris@16: parse_flags: Chris@16: // handle flags Chris@16: while ( start != last) { // as long as char is one of + - = _ # 0 l h or ' ' Chris@16: // misc switches Chris@16: switch ( wrap_narrow(fac, *start, 0)) { Chris@16: case '\'' : break; // no effect yet. (painful to implement) Chris@16: case 'l': Chris@16: case 'h': // short/long modifier : for printf-comaptibility (no action needed) Chris@16: break; Chris@16: case '-': Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::left; Chris@16: break; Chris@16: case '=': Chris@16: fpar->pad_scheme_ |= format_item_t::centered; Chris@16: break; Chris@16: case '_': Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::internal; Chris@16: break; Chris@16: case ' ': Chris@16: fpar->pad_scheme_ |= format_item_t::spacepad; Chris@16: break; Chris@16: case '+': Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::showpos; Chris@16: break; Chris@16: case '0': Chris@16: fpar->pad_scheme_ |= format_item_t::zeropad; Chris@16: // need to know alignment before really setting flags, Chris@16: // so just add 'zeropad' flag for now, it will be processed later. Chris@16: break; Chris@16: case '#': Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::showpoint | std::ios_base::showbase; Chris@16: break; Chris@16: default: Chris@16: goto parse_width; Chris@16: } Chris@16: ++start; Chris@16: } // loop on flag. Chris@16: Chris@16: if( start>=last) { Chris@16: maybe_throw_exception(exceptions, start-start0+offset, fstring_size); Chris@16: return true; Chris@16: } Chris@16: parse_width: Chris@16: // handle width spec Chris@16: // first skip 'asterisk fields' : *, or *N$ Chris@16: if(*start == const_or_not(fac).widen( '*') ) Chris@16: start = skip_asterisk(start, last, fac); Chris@16: if(start!=last && wrap_isdigit(fac, *start)) Chris@16: start = str2int(start, last, fpar->fmtstate_.width_, fac); Chris@16: Chris@16: parse_precision: Chris@16: if( start>= last) { Chris@16: maybe_throw_exception(exceptions, start-start0+offset, fstring_size); Chris@16: return true; Chris@16: } Chris@16: // handle precision spec Chris@16: if (*start== const_or_not(fac).widen( '.')) { Chris@16: ++start; Chris@16: if(start != last && *start == const_or_not(fac).widen( '*') ) Chris@16: start = skip_asterisk(start, last, fac); Chris@16: if(start != last && wrap_isdigit(fac, *start)) { Chris@16: start = str2int(start, last, fpar->fmtstate_.precision_, fac); Chris@16: precision_set = true; Chris@16: } Chris@16: else Chris@16: fpar->fmtstate_.precision_ =0; Chris@16: } Chris@16: Chris@16: // handle formatting-type flags : Chris@16: while( start != last && ( *start== const_or_not(fac).widen( 'l') Chris@16: || *start== const_or_not(fac).widen( 'L') Chris@16: || *start== const_or_not(fac).widen( 'h')) ) Chris@16: ++start; Chris@16: if( start>=last) { Chris@16: maybe_throw_exception(exceptions, start-start0+offset, fstring_size); Chris@16: return true; Chris@16: } Chris@16: Chris@16: if( in_brackets && *start== const_or_not(fac).widen( '|') ) { Chris@16: ++start; Chris@16: return true; Chris@16: } Chris@16: switch ( wrap_narrow(fac, *start, 0) ) { Chris@16: case 'X': Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::uppercase; Chris@16: case 'p': // pointer => set hex. Chris@16: case 'x': Chris@16: fpar->fmtstate_.flags_ &= ~std::ios_base::basefield; Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::hex; Chris@16: break; Chris@16: Chris@16: case 'o': Chris@16: fpar->fmtstate_.flags_ &= ~std::ios_base::basefield; Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::oct; Chris@16: break; Chris@16: Chris@16: case 'E': Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::uppercase; Chris@16: case 'e': Chris@16: fpar->fmtstate_.flags_ &= ~std::ios_base::floatfield; Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::scientific; Chris@16: Chris@16: fpar->fmtstate_.flags_ &= ~std::ios_base::basefield; Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::dec; Chris@16: break; Chris@16: Chris@16: case 'f': Chris@16: fpar->fmtstate_.flags_ &= ~std::ios_base::floatfield; Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::fixed; Chris@16: case 'u': Chris@16: case 'd': Chris@16: case 'i': Chris@16: fpar->fmtstate_.flags_ &= ~std::ios_base::basefield; Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::dec; Chris@16: break; Chris@16: Chris@16: case 'T': Chris@16: ++start; Chris@16: if( start >= last) Chris@16: maybe_throw_exception(exceptions, start-start0+offset, fstring_size); Chris@16: else Chris@16: fpar->fmtstate_.fill_ = *start; Chris@16: fpar->pad_scheme_ |= format_item_t::tabulation; Chris@16: fpar->argN_ = format_item_t::argN_tabulation; Chris@16: break; Chris@16: case 't': Chris@16: fpar->fmtstate_.fill_ = const_or_not(fac).widen( ' '); Chris@16: fpar->pad_scheme_ |= format_item_t::tabulation; Chris@16: fpar->argN_ = format_item_t::argN_tabulation; Chris@16: break; Chris@16: Chris@16: case 'G': Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::uppercase; Chris@16: break; Chris@16: case 'g': // 'g' conversion is default for floats. Chris@16: fpar->fmtstate_.flags_ &= ~std::ios_base::basefield; Chris@16: fpar->fmtstate_.flags_ |= std::ios_base::dec; Chris@16: Chris@16: // CLEAR all floatield flags, so stream will CHOOSE Chris@16: fpar->fmtstate_.flags_ &= ~std::ios_base::floatfield; Chris@16: break; Chris@16: Chris@16: case 'C': Chris@16: case 'c': Chris@16: fpar->truncate_ = 1; Chris@16: break; Chris@16: case 'S': Chris@16: case 's': Chris@16: if(precision_set) // handle truncation manually, with own parameter. Chris@16: fpar->truncate_ = fpar->fmtstate_.precision_; Chris@16: fpar->fmtstate_.precision_ = 6; // default stream precision. Chris@16: break; Chris@16: case 'n' : Chris@16: fpar->argN_ = format_item_t::argN_ignored; Chris@16: break; Chris@16: default: Chris@16: maybe_throw_exception(exceptions, start-start0+offset, fstring_size); Chris@16: } Chris@16: ++start; Chris@16: Chris@16: if( in_brackets ) { Chris@16: if( start != last && *start== const_or_not(fac).widen( '|') ) { Chris@16: ++start; Chris@16: return true; Chris@16: } Chris@16: else maybe_throw_exception(exceptions, start-start0+offset, fstring_size); Chris@16: } Chris@16: return true; Chris@16: } Chris@16: // -end parse_printf_directive() Chris@16: Chris@16: template Chris@16: int upper_bound_from_fstring(const String& buf, Chris@16: const typename String::value_type arg_mark, Chris@16: const Facet& fac, Chris@16: unsigned char exceptions) Chris@16: { Chris@16: // quick-parsing of the format-string to count arguments mark (arg_mark, '%') Chris@16: // returns : upper bound on the number of format items in the format strings Chris@16: using namespace boost::io; Chris@16: typename String::size_type i1=0; Chris@16: int num_items=0; Chris@16: while( (i1=buf.find(arg_mark,i1)) != String::npos ) { Chris@16: if( i1+1 >= buf.size() ) { Chris@16: if(exceptions & bad_format_string_bit) Chris@16: boost::throw_exception(bad_format_string(i1, buf.size() )); // must not end in ".. %" Chris@16: else { Chris@16: ++num_items; Chris@16: break; Chris@16: } Chris@16: } Chris@16: if(buf[i1+1] == buf[i1] ) {// escaped "%%" Chris@16: i1+=2; continue; Chris@16: } Chris@16: Chris@16: ++i1; Chris@16: // in case of %N% directives, dont count it double (wastes allocations..) : Chris@16: i1 = detail::wrap_scan_notdigit(fac, buf.begin()+i1, buf.end()) - buf.begin(); Chris@16: if( i1 < buf.size() && buf[i1] == arg_mark ) Chris@16: ++i1; Chris@16: ++num_items; Chris@16: } Chris@16: return num_items; Chris@16: } Chris@16: template inline Chris@16: void append_string(String& dst, const String& src, Chris@16: const typename String::size_type beg, Chris@16: const typename String::size_type end) { Chris@16: dst.append(src.begin()+beg, src.begin()+end); Chris@16: } Chris@16: Chris@16: } // detail namespace Chris@16: } // io namespace Chris@16: Chris@16: Chris@16: Chris@16: // ----------------------------------------------- Chris@16: // format :: parse(..) Chris@16: Chris@16: template Chris@16: basic_format& basic_format:: Chris@16: parse (const string_type& buf) { Chris@16: // parse the format-string Chris@16: using namespace std; Chris@16: #if !defined(BOOST_NO_STD_LOCALE) Chris@16: const std::ctype & fac = BOOST_USE_FACET( std::ctype, getloc()); Chris@16: #else Chris@16: io::basic_oaltstringstream fac; Chris@16: //has widen and narrow even on compilers without locale Chris@16: #endif Chris@16: Chris@16: const Ch arg_mark = io::detail::const_or_not(fac).widen( '%'); Chris@16: bool ordered_args=true; Chris@16: int max_argN=-1; Chris@16: Chris@16: // A: find upper_bound on num_items and allocates arrays Chris@16: int num_items = io::detail::upper_bound_from_fstring(buf, arg_mark, fac, exceptions()); Chris@16: make_or_reuse_data(num_items); Chris@16: Chris@16: // B: Now the real parsing of the format string : Chris@16: num_items=0; Chris@16: typename string_type::size_type i0=0, i1=0; Chris@16: typename string_type::const_iterator it; Chris@16: bool special_things=false; Chris@16: int cur_item=0; Chris@16: while( (i1=buf.find(arg_mark,i1)) != string_type::npos ) { Chris@16: string_type & piece = (cur_item==0) ? prefix_ : items_[cur_item-1].appendix_; Chris@16: if( buf[i1+1] == buf[i1] ) { // escaped mark, '%%' Chris@16: io::detail::append_string(piece, buf, i0, i1+1); Chris@16: i1+=2; i0=i1; Chris@16: continue; Chris@16: } Chris@16: BOOST_ASSERT( static_cast(cur_item) < items_.size() || cur_item==0); Chris@16: Chris@16: if(i1!=i0) { Chris@16: io::detail::append_string(piece, buf, i0, i1); Chris@16: i0=i1; Chris@16: } Chris@16: ++i1; Chris@16: it = buf.begin()+i1; Chris@16: bool parse_ok = io::detail::parse_printf_directive( Chris@16: it, buf.end(), &items_[cur_item], fac, i1, exceptions()); Chris@16: i1 = it - buf.begin(); Chris@16: if( ! parse_ok ) // the directive will be printed verbatim Chris@16: continue; Chris@16: i0=i1; Chris@16: items_[cur_item].compute_states(); // process complex options, like zeropad, into params Chris@16: Chris@16: int argN=items_[cur_item].argN_; Chris@16: if(argN == format_item_t::argN_ignored) Chris@16: continue; Chris@16: if(argN ==format_item_t::argN_no_posit) Chris@16: ordered_args=false; Chris@16: else if(argN == format_item_t::argN_tabulation) special_things=true; Chris@16: else if(argN > max_argN) max_argN = argN; Chris@16: ++num_items; Chris@16: ++cur_item; Chris@16: } // loop on %'s Chris@16: BOOST_ASSERT(cur_item == num_items); Chris@16: Chris@16: // store the final piece of string Chris@16: { Chris@16: string_type & piece = (cur_item==0) ? prefix_ : items_[cur_item-1].appendix_; Chris@16: io::detail::append_string(piece, buf, i0, buf.size()); Chris@16: } Chris@16: Chris@16: if( !ordered_args) { Chris@16: if(max_argN >= 0 ) { // dont mix positional with non-positionnal directives Chris@16: if(exceptions() & io::bad_format_string_bit) Chris@101: boost::throw_exception( Chris@101: io::bad_format_string(static_cast(max_argN), 0)); Chris@16: // else do nothing. => positionnal arguments are processed as non-positionnal Chris@16: } Chris@16: // set things like it would have been with positional directives : Chris@16: int non_ordered_items = 0; Chris@16: for(int i=0; i< num_items; ++i) Chris@16: if(items_[i].argN_ == format_item_t::argN_no_posit) { Chris@16: items_[i].argN_ = non_ordered_items; Chris@16: ++non_ordered_items; Chris@16: } Chris@16: max_argN = non_ordered_items-1; Chris@16: } Chris@16: Chris@16: // C: set some member data : Chris@16: items_.resize(num_items, format_item_t(io::detail::const_or_not(fac).widen( ' ')) ); Chris@16: Chris@16: if(special_things) style_ |= special_needs; Chris@16: num_args_ = max_argN + 1; Chris@16: if(ordered_args) style_ |= ordered; Chris@16: else style_ &= ~ordered; Chris@16: return *this; Chris@16: } Chris@16: Chris@16: } // namespace boost Chris@16: Chris@16: Chris@16: #endif // BOOST_FORMAT_PARSING_HPP