os/ossrv/ossrv_pub/boost_apis/boost/token_functions.hpp
author sl
Tue, 10 Jun 2014 14:32:02 +0200
changeset 1 260cb5ec6c19
permissions -rw-r--r--
Update contrib.
sl@0
     1
// Boost token_functions.hpp  ------------------------------------------------//
sl@0
     2
sl@0
     3
// Copyright John R. Bandela 2001. 
sl@0
     4
sl@0
     5
// Distributed under the Boost Software License, Version 1.0. (See
sl@0
     6
// accompanying file LICENSE_1_0.txt or copy at
sl@0
     7
// http://www.boost.org/LICENSE_1_0.txt)
sl@0
     8
sl@0
     9
// See http://www.boost.org/libs/tokenizer/ for documentation.
sl@0
    10
sl@0
    11
// Revision History:
sl@0
    12
// 01 Oct 2004   Joaquín M López Muñoz
sl@0
    13
//      Workaround for a problem with string::assign in msvc-stlport
sl@0
    14
// 06 Apr 2004   John Bandela
sl@0
    15
//      Fixed a bug involving using char_delimiter with a true input iterator
sl@0
    16
// 28 Nov 2003   Robert Zeh and John Bandela
sl@0
    17
//      Converted into "fast" functions that avoid using += when
sl@0
    18
//      the supplied iterator isn't an input_iterator; based on
sl@0
    19
//      some work done at Archelon and a version that was checked into
sl@0
    20
//      the boost CVS for a short period of time.
sl@0
    21
// 20 Feb 2002   John Maddock
sl@0
    22
//      Removed using namespace std declarations and added
sl@0
    23
//      workaround for BOOST_NO_STDC_NAMESPACE (the library
sl@0
    24
//      can be safely mixed with regex).
sl@0
    25
// 06 Feb 2002   Jeremy Siek
sl@0
    26
//      Added char_separator.
sl@0
    27
// 02 Feb 2002   Jeremy Siek
sl@0
    28
//      Removed tabs and a little cleanup.
sl@0
    29
sl@0
    30
sl@0
    31
#ifndef BOOST_TOKEN_FUNCTIONS_JRB120303_HPP_
sl@0
    32
#define BOOST_TOKEN_FUNCTIONS_JRB120303_HPP_
sl@0
    33
sl@0
    34
#include <vector>
sl@0
    35
#include <stdexcept>
sl@0
    36
#include <string>
sl@0
    37
#include <cctype>
sl@0
    38
#include <algorithm> // for find_if
sl@0
    39
#include <boost/config.hpp>
sl@0
    40
#include <boost/assert.hpp>
sl@0
    41
#include <boost/detail/workaround.hpp>
sl@0
    42
#include <boost/mpl/if.hpp>
sl@0
    43
sl@0
    44
//
sl@0
    45
// the following must not be macros if we are to prefix them
sl@0
    46
// with std:: (they shouldn't be macros anyway...)
sl@0
    47
//
sl@0
    48
#ifdef ispunct
sl@0
    49
#  undef ispunct
sl@0
    50
#endif
sl@0
    51
#ifdef isspace
sl@0
    52
#  undef isspace
sl@0
    53
#endif
sl@0
    54
//
sl@0
    55
// fix namespace problems:
sl@0
    56
//
sl@0
    57
#ifdef BOOST_NO_STDC_NAMESPACE
sl@0
    58
namespace std{
sl@0
    59
 using ::ispunct;
sl@0
    60
 using ::isspace;
sl@0
    61
}
sl@0
    62
#endif
sl@0
    63
sl@0
    64
namespace boost{
sl@0
    65
sl@0
    66
  //===========================================================================
sl@0
    67
  // The escaped_list_separator class. Which is a model of TokenizerFunction
sl@0
    68
  // An escaped list is a super-set of what is commonly known as a comma 
sl@0
    69
  // separated value (csv) list.It is separated into fields by a comma or 
sl@0
    70
  // other character. If the delimiting character is inside quotes, then it is
sl@0
    71
  // counted as a regular character.To allow for embedded quotes in a field,
sl@0
    72
  // there can be escape sequences using the \ much like C. 
sl@0
    73
  // The role of the comma, the quotation mark, and the escape 
sl@0
    74
  // character (backslash \), can be assigned to other characters.
sl@0
    75
sl@0
    76
  struct escaped_list_error : public std::runtime_error{
sl@0
    77
    escaped_list_error(const std::string& what_arg):std::runtime_error(what_arg) { }
sl@0
    78
  };
sl@0
    79
  
sl@0
    80
sl@0
    81
// The out of the box GCC 2.95 on cygwin does not have a char_traits class.
sl@0
    82
// MSVC does not like the following typename
sl@0
    83
#if !defined(BOOST_MSVC) || BOOST_MSVC > 1300
sl@0
    84
  template <class Char, 
sl@0
    85
    class Traits = typename std::basic_string<Char>::traits_type >
sl@0
    86
#else
sl@0
    87
  template <class Char, 
sl@0
    88
    class Traits = std::basic_string<Char>::traits_type >
sl@0
    89
#endif
sl@0
    90
  class escaped_list_separator {
sl@0
    91
sl@0
    92
  private:
sl@0
    93
    typedef std::basic_string<Char,Traits> string_type;
sl@0
    94
    struct char_eq {
sl@0
    95
      Char e_;
sl@0
    96
      char_eq(Char e):e_(e) { }
sl@0
    97
      bool operator()(Char c) {
sl@0
    98
        return Traits::eq(e_,c);
sl@0
    99
      }
sl@0
   100
    };
sl@0
   101
    string_type  escape_;
sl@0
   102
    string_type  c_;
sl@0
   103
    string_type  quote_;      
sl@0
   104
    bool last_;
sl@0
   105
sl@0
   106
    bool is_escape(Char e) {
sl@0
   107
      char_eq f(e);
sl@0
   108
      return std::find_if(escape_.begin(),escape_.end(),f)!=escape_.end();
sl@0
   109
    }
sl@0
   110
    bool is_c(Char e) {
sl@0
   111
      char_eq f(e);
sl@0
   112
      return std::find_if(c_.begin(),c_.end(),f)!=c_.end();
sl@0
   113
    }
sl@0
   114
    bool is_quote(Char e) {
sl@0
   115
      char_eq f(e);
sl@0
   116
      return std::find_if(quote_.begin(),quote_.end(),f)!=quote_.end();
sl@0
   117
    }
sl@0
   118
    template <typename iterator, typename Token>
sl@0
   119
    void do_escape(iterator& next,iterator end,Token& tok) {
sl@0
   120
      if (++next == end)
sl@0
   121
        throw escaped_list_error(std::string("cannot end with escape"));
sl@0
   122
      if (Traits::eq(*next,'n')) {
sl@0
   123
        tok+='\n';
sl@0
   124
        return;
sl@0
   125
      }
sl@0
   126
      else if (is_quote(*next)) {
sl@0
   127
        tok+=*next;
sl@0
   128
        return;
sl@0
   129
      }
sl@0
   130
      else if (is_c(*next)) {
sl@0
   131
        tok+=*next;
sl@0
   132
        return;
sl@0
   133
      }
sl@0
   134
      else if (is_escape(*next)) {
sl@0
   135
        tok+=*next;
sl@0
   136
        return;
sl@0
   137
      }
sl@0
   138
      else
sl@0
   139
        throw escaped_list_error(std::string("unknown escape sequence"));
sl@0
   140
    }
sl@0
   141
sl@0
   142
    public:
sl@0
   143
    
sl@0
   144
    explicit escaped_list_separator(Char  e = '\\',
sl@0
   145
                                    Char c = ',',Char  q = '\"')
sl@0
   146
      : escape_(1,e), c_(1,c), quote_(1,q), last_(false) { }
sl@0
   147
    
sl@0
   148
    escaped_list_separator(string_type e, string_type c, string_type q)
sl@0
   149
      : escape_(e), c_(c), quote_(q), last_(false) { }
sl@0
   150
    
sl@0
   151
    void reset() {last_=false;}
sl@0
   152
sl@0
   153
    template <typename InputIterator, typename Token>
sl@0
   154
    bool operator()(InputIterator& next,InputIterator end,Token& tok) {
sl@0
   155
      bool bInQuote = false;
sl@0
   156
      tok = Token();
sl@0
   157
      
sl@0
   158
      if (next == end) {
sl@0
   159
        if (last_) {
sl@0
   160
          last_ = false;
sl@0
   161
          return true;
sl@0
   162
        }
sl@0
   163
        else
sl@0
   164
          return false;
sl@0
   165
      }
sl@0
   166
      last_ = false;
sl@0
   167
      for (;next != end;++next) {
sl@0
   168
        if (is_escape(*next)) {
sl@0
   169
          do_escape(next,end,tok);
sl@0
   170
        }
sl@0
   171
        else if (is_c(*next)) {
sl@0
   172
          if (!bInQuote) {
sl@0
   173
            // If we are not in quote, then we are done
sl@0
   174
            ++next;
sl@0
   175
            // The last character was a c, that means there is
sl@0
   176
            // 1 more blank field
sl@0
   177
            last_ = true; 
sl@0
   178
            return true;
sl@0
   179
          }
sl@0
   180
          else tok+=*next;
sl@0
   181
        }
sl@0
   182
        else if (is_quote(*next)) {
sl@0
   183
          bInQuote=!bInQuote;
sl@0
   184
        }
sl@0
   185
        else {
sl@0
   186
          tok += *next;
sl@0
   187
        }
sl@0
   188
      }
sl@0
   189
      return true;
sl@0
   190
    }
sl@0
   191
  };
sl@0
   192
sl@0
   193
  //===========================================================================
sl@0
   194
  // The classes here are used by offset_separator and char_separator to implement
sl@0
   195
  // faster assigning of tokens using assign instead of +=
sl@0
   196
  
sl@0
   197
  namespace tokenizer_detail {
sl@0
   198
sl@0
   199
  // The assign_or_plus_equal struct contains functions that implement
sl@0
   200
  // assign, +=, and clearing based on the iterator type.  The
sl@0
   201
  // generic case does nothing for plus_equal and clearing, while
sl@0
   202
  // passing through the call for assign.
sl@0
   203
  //
sl@0
   204
  // When an input iterator is being used, the situation is reversed.
sl@0
   205
  // The assign method does nothing, plus_equal invokes operator +=,
sl@0
   206
  // and the clearing method sets the supplied token to the default
sl@0
   207
  // token constructor's result.
sl@0
   208
  //
sl@0
   209
sl@0
   210
  template<class IteratorTag>
sl@0
   211
  struct assign_or_plus_equal {
sl@0
   212
    template<class Iterator, class Token>
sl@0
   213
    static void assign(Iterator b, Iterator e, Token &t) {
sl@0
   214
sl@0
   215
#if BOOST_WORKAROUND(BOOST_MSVC, < 1300) &&\
sl@0
   216
    BOOST_WORKAROUND(__SGI_STL_PORT, < 0x500) &&\
sl@0
   217
    defined(_STLP_DEBUG) &&\
sl@0
   218
    (defined(_STLP_USE_DYNAMIC_LIB) || defined(_DLL))
sl@0
   219
    // Problem with string::assign for msvc-stlport in debug mode: the
sl@0
   220
    // linker tries to import the templatized version of this memfun,
sl@0
   221
    // which is obviously not exported.
sl@0
   222
    // See http://www.stlport.com/dcforum/DCForumID6/1763.html for details.
sl@0
   223
sl@0
   224
      t = Token();
sl@0
   225
      while(b != e) t += *b++;
sl@0
   226
#else
sl@0
   227
      t.assign(b, e);
sl@0
   228
#endif
sl@0
   229
sl@0
   230
    }
sl@0
   231
sl@0
   232
    template<class Token, class Value> 
sl@0
   233
    static void plus_equal(Token &, const Value &) {
sl@0
   234
    
sl@0
   235
  }
sl@0
   236
sl@0
   237
    // If we are doing an assign, there is no need for the
sl@0
   238
    // the clear. 
sl@0
   239
    //
sl@0
   240
    template<class Token>
sl@0
   241
    static void clear(Token &) {
sl@0
   242
sl@0
   243
    }
sl@0
   244
  };
sl@0
   245
sl@0
   246
  template <>
sl@0
   247
  struct assign_or_plus_equal<std::input_iterator_tag> {
sl@0
   248
    template<class Iterator, class Token>
sl@0
   249
    static void assign(Iterator b, Iterator e, Token &t) {
sl@0
   250
sl@0
   251
    }
sl@0
   252
    template<class Token, class Value> 
sl@0
   253
    static void plus_equal(Token &t, const Value &v) {
sl@0
   254
      t += v;
sl@0
   255
    }
sl@0
   256
    template<class Token>
sl@0
   257
    static void clear(Token &t) {
sl@0
   258
      t = Token();
sl@0
   259
    }
sl@0
   260
  };
sl@0
   261
sl@0
   262
sl@0
   263
  template<class Iterator>
sl@0
   264
  struct pointer_iterator_category{
sl@0
   265
    typedef std::random_access_iterator_tag type;
sl@0
   266
  };
sl@0
   267
sl@0
   268
sl@0
   269
  template<class Iterator>
sl@0
   270
  struct class_iterator_category{
sl@0
   271
    typedef typename Iterator::iterator_category type;
sl@0
   272
  };
sl@0
   273
sl@0
   274
sl@0
   275
sl@0
   276
  // This portably gets the iterator_tag without partial template specialization
sl@0
   277
  template<class Iterator>
sl@0
   278
    struct get_iterator_category{
sl@0
   279
    typedef typename mpl::if_<is_pointer<Iterator>,
sl@0
   280
      pointer_iterator_category<Iterator>,
sl@0
   281
      class_iterator_category<Iterator>
sl@0
   282
    >::type cat;
sl@0
   283
sl@0
   284
    typedef typename cat::type iterator_category;
sl@0
   285
  };
sl@0
   286
sl@0
   287
  
sl@0
   288
}
sl@0
   289
sl@0
   290
   
sl@0
   291
  //===========================================================================
sl@0
   292
  // The offset_separator class, which is a model of TokenizerFunction.
sl@0
   293
  // Offset breaks a string into tokens based on a range of offsets
sl@0
   294
sl@0
   295
  class offset_separator {
sl@0
   296
  private:
sl@0
   297
sl@0
   298
    std::vector<int> offsets_;
sl@0
   299
    unsigned int current_offset_;
sl@0
   300
    bool wrap_offsets_;
sl@0
   301
    bool return_partial_last_;
sl@0
   302
    
sl@0
   303
  public:
sl@0
   304
    template <typename Iter>
sl@0
   305
    offset_separator(Iter begin, Iter end, bool wrap_offsets = true,
sl@0
   306
                     bool return_partial_last = true)
sl@0
   307
      : offsets_(begin,end), current_offset_(0),
sl@0
   308
        wrap_offsets_(wrap_offsets),
sl@0
   309
        return_partial_last_(return_partial_last) { }
sl@0
   310
   
sl@0
   311
    offset_separator()
sl@0
   312
      : offsets_(1,1), current_offset_(),
sl@0
   313
        wrap_offsets_(true), return_partial_last_(true) { }
sl@0
   314
sl@0
   315
    void reset() {
sl@0
   316
      current_offset_ = 0;
sl@0
   317
    }
sl@0
   318
sl@0
   319
    template <typename InputIterator, typename Token>
sl@0
   320
    bool operator()(InputIterator& next, InputIterator end, Token& tok)
sl@0
   321
    {
sl@0
   322
      typedef tokenizer_detail::assign_or_plus_equal<
sl@0
   323
#if     !defined(BOOST_MSVC) || BOOST_MSVC > 1300
sl@0
   324
        typename
sl@0
   325
#endif
sl@0
   326
        tokenizer_detail::get_iterator_category<
sl@0
   327
        InputIterator>::iterator_category> assigner;
sl@0
   328
sl@0
   329
sl@0
   330
      BOOST_ASSERT(!offsets_.empty());
sl@0
   331
    
sl@0
   332
      assigner::clear(tok);
sl@0
   333
      InputIterator start(next);
sl@0
   334
      
sl@0
   335
      if (next == end)
sl@0
   336
        return false;
sl@0
   337
sl@0
   338
      if (current_offset_ == offsets_.size())
sl@0
   339
        if (wrap_offsets_)
sl@0
   340
          current_offset_=0;
sl@0
   341
        else
sl@0
   342
          return false;
sl@0
   343
      
sl@0
   344
      int c = offsets_[current_offset_];
sl@0
   345
      int i = 0;
sl@0
   346
      for (; i < c; ++i) {
sl@0
   347
        if (next == end)break;
sl@0
   348
        assigner::plus_equal(tok,*next++);
sl@0
   349
      }
sl@0
   350
      assigner::assign(start,next,tok);
sl@0
   351
    
sl@0
   352
      if (!return_partial_last_)
sl@0
   353
        if (i < (c-1) )
sl@0
   354
          return false;
sl@0
   355
      
sl@0
   356
      ++current_offset_;
sl@0
   357
      return true;
sl@0
   358
    }
sl@0
   359
  };
sl@0
   360
sl@0
   361
sl@0
   362
  //===========================================================================
sl@0
   363
  // The char_separator class breaks a sequence of characters into
sl@0
   364
  // tokens based on the character delimiters (very much like bad old
sl@0
   365
  // strtok). A delimiter character can either be kept or dropped. A
sl@0
   366
  // kept delimiter shows up as an output token, whereas a dropped
sl@0
   367
  // delimiter does not.
sl@0
   368
sl@0
   369
  // This class replaces the char_delimiters_separator class. The
sl@0
   370
  // constructor for the char_delimiters_separator class was too
sl@0
   371
  // confusing and needed to be deprecated. However, because of the
sl@0
   372
  // default arguments to the constructor, adding the new constructor
sl@0
   373
  // would cause ambiguity, so instead I deprecated the whole class.
sl@0
   374
  // The implementation of the class was also simplified considerably.
sl@0
   375
sl@0
   376
  enum empty_token_policy { drop_empty_tokens, keep_empty_tokens };
sl@0
   377
sl@0
   378
  // The out of the box GCC 2.95 on cygwin does not have a char_traits class.
sl@0
   379
#if !defined(BOOST_MSVC) || BOOST_MSVC > 1300
sl@0
   380
  template <typename Char, 
sl@0
   381
    typename Traits = typename std::basic_string<Char>::traits_type >
sl@0
   382
#else
sl@0
   383
  template <typename Char, 
sl@0
   384
    typename Traits = std::basic_string<Char>::traits_type >
sl@0
   385
#endif
sl@0
   386
  class char_separator
sl@0
   387
  {
sl@0
   388
    typedef std::basic_string<Char,Traits> string_type;
sl@0
   389
  public:
sl@0
   390
    explicit 
sl@0
   391
    char_separator(const Char* dropped_delims,
sl@0
   392
                   const Char* kept_delims = 0,
sl@0
   393
                   empty_token_policy empty_tokens = drop_empty_tokens)
sl@0
   394
      : m_dropped_delims(dropped_delims),
sl@0
   395
        m_use_ispunct(false),
sl@0
   396
        m_use_isspace(false),
sl@0
   397
        m_empty_tokens(empty_tokens),
sl@0
   398
        m_output_done(false)
sl@0
   399
    {
sl@0
   400
      // Borland workaround
sl@0
   401
      if (kept_delims)
sl@0
   402
        m_kept_delims = kept_delims;
sl@0
   403
    }
sl@0
   404
sl@0
   405
                // use ispunct() for kept delimiters and isspace for dropped.
sl@0
   406
    explicit
sl@0
   407
    char_separator()
sl@0
   408
      : m_use_ispunct(true), 
sl@0
   409
        m_use_isspace(true), 
sl@0
   410
        m_empty_tokens(drop_empty_tokens) { }
sl@0
   411
sl@0
   412
    void reset() { }
sl@0
   413
sl@0
   414
    template <typename InputIterator, typename Token>
sl@0
   415
    bool operator()(InputIterator& next, InputIterator end, Token& tok)
sl@0
   416
    {
sl@0
   417
      typedef tokenizer_detail::assign_or_plus_equal<
sl@0
   418
#if     !defined(BOOST_MSVC) || BOOST_MSVC > 1300
sl@0
   419
        typename
sl@0
   420
#endif
sl@0
   421
        tokenizer_detail::get_iterator_category<
sl@0
   422
        InputIterator>::iterator_category> assigner;
sl@0
   423
sl@0
   424
      assigner::clear(tok);
sl@0
   425
sl@0
   426
      // skip past all dropped_delims
sl@0
   427
      if (m_empty_tokens == drop_empty_tokens)
sl@0
   428
        for (; next != end  && is_dropped(*next); ++next)
sl@0
   429
          { }
sl@0
   430
      
sl@0
   431
      InputIterator start(next);
sl@0
   432
sl@0
   433
      if (m_empty_tokens == drop_empty_tokens) {
sl@0
   434
sl@0
   435
        if (next == end)
sl@0
   436
          return false;
sl@0
   437
sl@0
   438
sl@0
   439
        // if we are on a kept_delims move past it and stop
sl@0
   440
        if (is_kept(*next)) {
sl@0
   441
          assigner::plus_equal(tok,*next);
sl@0
   442
          ++next;
sl@0
   443
        } else
sl@0
   444
          // append all the non delim characters
sl@0
   445
          for (; next != end && !is_dropped(*next) && !is_kept(*next); ++next)
sl@0
   446
            assigner::plus_equal(tok,*next);
sl@0
   447
      } 
sl@0
   448
      else { // m_empty_tokens == keep_empty_tokens
sl@0
   449
        
sl@0
   450
        // Handle empty token at the end
sl@0
   451
        if (next == end)
sl@0
   452
          if (m_output_done == false) {
sl@0
   453
            m_output_done = true;
sl@0
   454
            assigner::assign(start,next,tok);
sl@0
   455
            return true;
sl@0
   456
          } else
sl@0
   457
            return false;
sl@0
   458
        
sl@0
   459
        if (is_kept(*next)) {
sl@0
   460
          if (m_output_done == false)
sl@0
   461
            m_output_done = true;
sl@0
   462
          else {
sl@0
   463
            assigner::plus_equal(tok,*next);
sl@0
   464
            ++next;
sl@0
   465
            m_output_done = false;
sl@0
   466
          }
sl@0
   467
        } 
sl@0
   468
        else if (m_output_done == false && is_dropped(*next)) {
sl@0
   469
          m_output_done = true;
sl@0
   470
        } 
sl@0
   471
        else {
sl@0
   472
          if (is_dropped(*next))
sl@0
   473
            start=++next;
sl@0
   474
          for (; next != end && !is_dropped(*next) && !is_kept(*next); ++next)
sl@0
   475
            assigner::plus_equal(tok,*next);
sl@0
   476
          m_output_done = true;
sl@0
   477
        }
sl@0
   478
      }
sl@0
   479
      assigner::assign(start,next,tok);
sl@0
   480
      return true;
sl@0
   481
    }
sl@0
   482
sl@0
   483
  private:
sl@0
   484
    string_type m_kept_delims;
sl@0
   485
    string_type m_dropped_delims;
sl@0
   486
    bool m_use_ispunct;
sl@0
   487
    bool m_use_isspace;
sl@0
   488
    empty_token_policy m_empty_tokens;
sl@0
   489
    bool m_output_done;
sl@0
   490
    
sl@0
   491
    bool is_kept(Char E) const
sl@0
   492
    {  
sl@0
   493
      if (m_kept_delims.length())
sl@0
   494
        return m_kept_delims.find(E) != string_type::npos;
sl@0
   495
      else if (m_use_ispunct) {
sl@0
   496
        return std::ispunct(E) != 0;
sl@0
   497
      } else
sl@0
   498
        return false;
sl@0
   499
    }
sl@0
   500
    bool is_dropped(Char E) const
sl@0
   501
    {
sl@0
   502
      if (m_dropped_delims.length())
sl@0
   503
        return m_dropped_delims.find(E) != string_type::npos;
sl@0
   504
      else if (m_use_isspace) {
sl@0
   505
        return std::isspace(E) != 0;
sl@0
   506
      } else
sl@0
   507
        return false;
sl@0
   508
    }
sl@0
   509
  };
sl@0
   510
sl@0
   511
  //===========================================================================
sl@0
   512
  // The following class is DEPRECATED, use class char_separators instead.
sl@0
   513
  //
sl@0
   514
  // The char_delimiters_separator class, which is a model of
sl@0
   515
  // TokenizerFunction.  char_delimiters_separator breaks a string
sl@0
   516
  // into tokens based on character delimiters. There are 2 types of
sl@0
   517
  // delimiters. returnable delimiters can be returned as
sl@0
   518
  // tokens. These are often punctuation. nonreturnable delimiters
sl@0
   519
  // cannot be returned as tokens. These are often whitespace
sl@0
   520
sl@0
   521
  // The out of the box GCC 2.95 on cygwin does not have a char_traits class.
sl@0
   522
#if !defined(BOOST_MSVC) || BOOST_MSVC > 1300
sl@0
   523
  template <class Char, 
sl@0
   524
    class Traits = typename std::basic_string<Char>::traits_type >
sl@0
   525
#else
sl@0
   526
  template <class Char, 
sl@0
   527
    class Traits = std::basic_string<Char>::traits_type >
sl@0
   528
#endif
sl@0
   529
  class char_delimiters_separator {
sl@0
   530
  private:  
sl@0
   531
sl@0
   532
    typedef std::basic_string<Char,Traits> string_type;
sl@0
   533
    string_type returnable_;
sl@0
   534
    string_type nonreturnable_;
sl@0
   535
    bool return_delims_;
sl@0
   536
    bool no_ispunct_;
sl@0
   537
    bool no_isspace_;
sl@0
   538
    
sl@0
   539
    bool is_ret(Char E)const
sl@0
   540
    {  
sl@0
   541
      if (returnable_.length())
sl@0
   542
        return  returnable_.find(E) != string_type::npos;
sl@0
   543
      else{
sl@0
   544
        if (no_ispunct_) {return false;}
sl@0
   545
        else{
sl@0
   546
          int r = std::ispunct(E);
sl@0
   547
          return r != 0;
sl@0
   548
        }
sl@0
   549
      }
sl@0
   550
    }
sl@0
   551
    bool is_nonret(Char E)const
sl@0
   552
    {
sl@0
   553
      if (nonreturnable_.length())
sl@0
   554
        return  nonreturnable_.find(E) != string_type::npos;
sl@0
   555
      else{
sl@0
   556
        if (no_isspace_) {return false;}
sl@0
   557
        else{
sl@0
   558
          int r = std::isspace(E);
sl@0
   559
          return r != 0;
sl@0
   560
        }
sl@0
   561
      }
sl@0
   562
    }
sl@0
   563
    
sl@0
   564
  public:
sl@0
   565
    explicit char_delimiters_separator(bool return_delims = false, 
sl@0
   566
                                       const Char* returnable = 0,
sl@0
   567
                                       const Char* nonreturnable = 0)
sl@0
   568
      : returnable_(returnable ? returnable : string_type().c_str()),
sl@0
   569
        nonreturnable_(nonreturnable ? nonreturnable:string_type().c_str()),
sl@0
   570
        return_delims_(return_delims), no_ispunct_(returnable!=0),
sl@0
   571
        no_isspace_(nonreturnable!=0) { }
sl@0
   572
    
sl@0
   573
    void reset() { }
sl@0
   574
sl@0
   575
  public:
sl@0
   576
sl@0
   577
     template <typename InputIterator, typename Token>
sl@0
   578
     bool operator()(InputIterator& next, InputIterator end,Token& tok) {
sl@0
   579
     tok = Token();
sl@0
   580
     
sl@0
   581
     // skip past all nonreturnable delims
sl@0
   582
     // skip past the returnable only if we are not returning delims
sl@0
   583
     for (;next!=end && ( is_nonret(*next) || (is_ret(*next) 
sl@0
   584
       && !return_delims_ ) );++next) { }
sl@0
   585
     
sl@0
   586
     if (next == end) {
sl@0
   587
       return false;
sl@0
   588
     }
sl@0
   589
     
sl@0
   590
     // if we are to return delims and we are one a returnable one
sl@0
   591
     // move past it and stop
sl@0
   592
     if (is_ret(*next) && return_delims_) {
sl@0
   593
       tok+=*next;
sl@0
   594
       ++next;
sl@0
   595
     }
sl@0
   596
     else
sl@0
   597
       // append all the non delim characters
sl@0
   598
       for (;next!=end && !is_nonret(*next) && !is_ret(*next);++next)
sl@0
   599
         tok+=*next;
sl@0
   600
       
sl@0
   601
       
sl@0
   602
     return true;
sl@0
   603
   }
sl@0
   604
  };
sl@0
   605
sl@0
   606
sl@0
   607
} //namespace boost
sl@0
   608
sl@0
   609
sl@0
   610
#endif 
sl@0
   611
sl@0
   612
sl@0
   613
sl@0
   614
sl@0
   615