Main Page | Namespace List | Class Hierarchy | Alphabetical List | Class List | File List | Namespace Members | Class Members | File Members | Related Pages | Examples

tokenizer.h

Go to the documentation of this file.
00001 // Copyright (C) 1999-2003 Open Source Telecom Corporation. 00002 // 00003 // This program is free software; you can redistribute it and/or modify 00004 // it under the terms of the GNU General Public License as published by 00005 // the Free Software Foundation; either version 2 of the License, or 00006 // (at your option) any later version. 00007 // 00008 // This program is distributed in the hope that it will be useful, 00009 // but WITHOUT ANY WARRANTY; without even the implied warranty of 00010 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 00011 // GNU General Public License for more details. 00012 // 00013 // You should have received a copy of the GNU General Public License 00014 // along with this program; if not, write to the Free Software 00015 // Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. 00016 // 00017 // As a special exception to the GNU General Public License, permission is 00018 // granted for additional uses of the text contained in its release 00019 // of Common C++. 00020 // 00021 // The exception is that, if you link the Common C++ library with other 00022 // files to produce an executable, this does not by itself cause the 00023 // resulting executable to be covered by the GNU General Public License. 00024 // Your use of that executable is in no way restricted on account of 00025 // linking the Common C++ library code into it. 00026 // 00027 // This exception does not however invalidate any other reasons why 00028 // the executable file might be covered by the GNU General Public License. 00029 // 00030 // This exception applies only to the code released under the 00031 // name Common C++. If you copy code from other releases into a copy of 00032 // Common C++, as the General Public License permits, the exception does 00033 // not apply to the code that you add in this way. To avoid misleading 00034 // anyone as to the status of such modified files, you must delete 00035 // this exception notice from them. 00036 // 00037 // If you write modifications of your own for Common C++, it is your choice 00038 // whether to permit this exception to apply to your modifications. 00039 // If you do not wish that, delete this exception notice. 00040 00046 #ifndef CCXX_TOKENIZER_H_ 00047 #define CCXX_TOKENIZER_H_ 00048 00049 #ifndef CCXX_MISSING_H_ 00050 #include <cc++/missing.h> 00051 #endif 00052 00053 #ifndef CCXX_THREAD_H_ 00054 #include <cc++/thread.h> 00055 #endif 00056 00057 #ifdef CCXX_NAMESPACES 00058 namespace ost { 00059 #endif 00060 00104 class __EXPORT StringTokenizer { 00105 public: 00111 static const char * const SPACE; 00112 00122 // maybe move more global ? 00123 class NoSuchElementException { }; 00124 00129 class __EXPORT iterator { 00130 friend class StringTokenizer; // access our private constructors 00131 private: 00132 const StringTokenizer *myTok; // my StringTokenizer 00133 const char *start; // start of current token 00134 const char *tokEnd; // end of current token (->nxDelimiter) 00135 const char *endp; // one before next token 00136 char *token; // allocated token, if requested 00137 00138 // for initialization of the itEnd iterator 00139 iterator(const StringTokenizer &tok, const char *end) 00140 : myTok(&tok),tokEnd(0),endp(end),token(0) {} 00141 00142 iterator(const StringTokenizer &tok) 00143 : myTok(&tok),tokEnd(0),endp(myTok->str-1),token(0) { 00144 ++(*this); // init first token. 00145 } 00146 00147 public: 00148 iterator() : myTok(0),start(0),tokEnd(0),endp(0),token(0) {} 00149 00150 // see also: comment in implementation of operator++ 00151 virtual ~iterator() { if (token) *token='\0'; delete [] token; } 00152 00156 // everything, but not responsible for the allocated token. 00157 iterator(const iterator& i) : 00158 myTok(i.myTok),start(i.start),tokEnd(i.tokEnd), 00159 endp(i.endp),token(0) {} 00160 00164 // everything, but not responsible for the allocated token. 00165 iterator &operator = (const iterator &i) { 00166 myTok = i.myTok; 00167 start = i.start; endp = i.endp; tokEnd = i.tokEnd; 00168 if ( token ) 00169 delete [] token; 00170 token = 0; 00171 return *this; 00172 } 00173 00177 iterator &operator ++ () THROWS (NoSuchElementException); 00178 00187 const char* operator * () THROWS (NoSuchElementException); 00188 00195 inline char nextDelimiter() const { 00196 return (tokEnd) ? *tokEnd : '\0'; 00197 } 00198 00203 // only compare the end-position. speed. 00204 inline bool operator == (const iterator &other) const { 00205 return (endp == other.endp); 00206 } 00207 00212 // only compare the end position. speed. 00213 inline bool operator != (const iterator &other) const { 00214 return (endp != other.endp); 00215 } 00216 }; 00217 private: 00218 friend class StringTokenizer::iterator; 00219 const char *str; 00220 const char *delim; 00221 bool skipAll, trim; 00222 iterator itEnd; 00223 00224 public: 00263 StringTokenizer (const char *str, 00264 const char *delim, 00265 bool skipAllDelim = false, 00266 bool trim = false); 00267 00277 StringTokenizer (const char *s); 00278 00282 iterator begin() const { 00283 return iterator(*this); 00284 } 00285 00290 void setDelimiters (const char *d) { 00291 delim = d; 00292 } 00293 00298 iterator begin(const char *d) { 00299 delim = d; 00300 return iterator(*this); 00301 } 00302 00306 const iterator& end() const { return itEnd; } 00307 }; 00308 00309 #ifdef CCXX_NAMESPACES 00310 } 00311 #endif 00312 00313 #endif 00314

Generated on Fri Jan 21 13:36:02 2005 for GNU CommonC++ by doxygen 1.3.8