Planet
navi homePPSaboutscreenshotsdownloaddevelopmentforum

source: orxonox.OLD/trunk/src/lib/util/substring.cc @ 7366

Last change on this file since 7366 was 7325, checked in by bensch, 19 years ago

helpers

File size: 10.6 KB
RevLine 
[4597]1/*
[3941]2   orxonox - the future of 3D-vertical-scrollers
3
4   Copyright (C) 2004 orx
5
6   This program is free software; you can redistribute it and/or modify
7   it under the terms of the GNU General Public License as published by
8   the Free Software Foundation; either version 2, or (at your option)
9   any later version.
10
11   ### File Specific:
12   main-programmer: Christian Meyer
[4597]13   co-programmer: Benjamin Grauer
14
15   2005-06-10: some naming conventions
[7221]16
17//
18//  splitLine
19//  STL string tokenizer
20//
21//  Created by Clemens Wacha.
22//  Version 1.0
23//  Copyright (c) 2005 Clemens Wacha. All rights reserved.
24//
25
[4220]26*/
27
28#include "substring.h"
29
30#include <string.h>
[7221]31#include <cassert>
[4220]32
[7323]33
[7319]34/**
[7323]35 * @brief default constructor
36 */
37SubString::SubString()
38{
39}
40
41
42/**
[7319]43 * @brief create a SubString from
44 * @param string the String to Spilit
45 * @param splitter the Character at which to split string (delimiter)
46 */
[7221]47SubString::SubString(const std::string& string, char splitter)
[4220]48{
[7221]49  char split[2];
50  split[0] = splitter;
51  split[1] = '\0';
[7320]52  SubString::splitLine(this->strings, string, split);
[7221]53}
[4597]54
[7319]55
56/**
57 * @brief Splits a String into multiple splitters.
58 * @param string the String to split
59 * @param splitters multiple set of characters at what to split. (delimiters)
60 * @param escapeChar The Escape Character that overrides splitters commends and so on...
61 * @param safemode_char within these characters splitting won't happen
62 * @param comment_char the Comment character.
63 */
[7323]64SubString::SubString(const std::string& string, const std::string& splitters, char escapeChar, char safemode_char, char comment_char)
[7221]65{
[7320]66  SubString::splitLine(this->strings, string, splitters, escapeChar, safemode_char, comment_char);
[7221]67}
[4597]68
[7221]69/**
[7319]70 * @brief creates a SubSet of a SubString.
71 * @param subString the SubString to take a set from.
72 * @param subSetBegin the beginning to the end
[7221]73 */
[7319]74SubString::SubString(const SubString& subString, unsigned int subSetBegin)
75{
76  for (unsigned int i = subSetBegin; i < subString.size(); i++)
77    this->strings.push_back(subString[i]);
78}
79
80
81/**
82 * @brief creates a SubSet of a SubString.
83 * @param subString the SubString to take a Set from
84 * @param subSetBegin the beginning to the end
85 * @param subSetEnd the end of the SubSet (max subString.size() will be checked internaly)
86 */
87SubString::SubString(const SubString& subString, unsigned int subSetBegin, unsigned int subSetEnd)
88{
89  for (unsigned int i = subSetBegin; i < subString.size() || i < subSetEnd; i++)
90    this->strings.push_back(subString[i]);
91}
92
93
94/**
95 * @brief removes the object from memory
96 */
97SubString::~SubString()
98{ }
99
[7325]100/** @brief An empty String */
[7221]101const std::string SubString::emptyString = "";
[7325]102/** @brief Helper that gets you a String consisting of all White Spaces */
103const std::string SubString::WhiteSpaces = " \n\t";
104/** @brief Helper that gets you a String consisting of all WhiteSpaces and the Comma */
105const std::string SubString::WhiteSpacesWithComma = " \n\t,";
[4597]106
[7319]107/**
108 * @brief stores the Value of subString in this SubString
109 * @param subString will be copied into this String.
110 * @returns this SubString.
111 */
112SubString& SubString::operator=(const SubString& subString)
113{
114  this->strings = subString.strings;
115  return *this;
116}
[4597]117
118
[7319]119/**
120 * @brief comparator.
121 * @param subString the SubString to compare against this one.
122 * @returns true if the Stored Strings match
123 */
124bool SubString::operator==(const SubString& subString)
125{
126  return (this->strings == subString.strings);
127}
128
129
130/**
131 * @brief append operator
132 * @param subString the String to append.
133 * @returns a SubString where this and subString are appended.
134 */
135SubString SubString::operator+(const SubString& subString) const
136{
[7323]137  return SubString(*this) += subString;
[7319]138}
139
140
141/**
142 * @brief append operator.
143 * @param subString append subString to this SubString.
144 * @returns this substring appended with subString
145 */
146SubString& SubString::operator+=(const SubString& subString)
147{
148  for (unsigned int i = 0; i < subString.size(); i++)
149    this->strings.push_back(subString[i]);
[7323]150  return *this;
[7319]151}
152
153
154/**
155 * @brief Split the String at
156 * @param string where to split
157 * @param splitter delimiter.
158 */
[7221]159unsigned int SubString::split(const std::string& string, char splitter)
160{
161  this->strings.clear();
162  char split[2];
163  split[0] = splitter;
164  split[1] = '\0';
[7320]165  SubString::splitLine(this->strings, string, split);
[7221]166  return strings.size();
[4220]167}
168
[5183]169
[3941]170/**
[7319]171 * @brief Splits a String into multiple splitters.
172 * @param string the String to split
173 * @param splitters multiple set of characters at what to split. (delimiters)
174 * @param escapeChar The Escape Character that overrides splitters commends and so on...
175 * @param safemode_char within these characters splitting won't happen
176 * @param comment_char the Comment character.
177 */
[7221]178unsigned int SubString::split(const std::string& string, const std::string& splitters, char escapeChar,char safemode_char, char comment_char)
179{
180  this->strings.clear();
[7323]181  SubString::splitLine(this->strings, string, splitters, escapeChar, safemode_char, comment_char);
182  return this->strings.size();
[7221]183}
[5183]184
185
[7221]186/**
[7319]187 * @brief joins together all Strings of this Substring.
188 * @param delimiter the String between the subStrings.
189 * @returns the joined String.
190 */
191std::string SubString::join(const std::string& delimiter) const
192{
193  if (!this->strings.empty())
194  {
195    std::string retVal = this->strings[0];
[7321]196    for (unsigned int i = 1; i < this->strings.size(); i++)
[7319]197      retVal += delimiter + this->strings[i];
198    return retVal;
199  }
200  else
201    return SubString::emptyString;
202}
203
204
205/**
206 * @brief creates a SubSet of a SubString.
207 * @param subSetBegin the beginning to the end
208 * @returns the SubSet
209 *
210 * This function is added for your convenience, and does the same as
211 * SubString::SubString(const SubString& subString, unsigned int subSetBegin)
212 */
213SubString SubString::getSubSet(unsigned int subSetBegin) const
214{
215  return SubString(*this, subSetBegin);
216}
217
218
219/**
220 * @brief creates a SubSet of a SubString.
221 * @param subSetBegin the beginning to
222 * @param subSetEnd the end of the SubSet to select (if bigger than subString.size() it will be downset.)
223 * @returns the SubSet
224 *
225 * This function is added for your convenience, and does the same as
226 * SubString::SubString(const SubString& subString, unsigned int subSetBegin)
227 */
228SubString SubString::getSubSet(unsigned int subSetBegin, unsigned int subSetEnd) const
229{
230  return SubString(*this, subSetBegin, subSetEnd);
231}
232
233
234/**
[7221]235 * @brief splits line into tokens and stores them in ret.
236 * @param ret the Array, where the Splitted strings will be stored in
237 * @param offsets an Array of Offsets, here the distance from the inputstring
238 * to the beginning of the current token is stored
239 * @param line the inputLine to split
240 * @param delimiters a String of Delimiters (here the input will be splitted)
241 * @param escape_char: Escape carater (escapes splitters)
242 * @param safemode_char: the beginning of the safemode is marked with this
243 * @param comment_char: the beginning of a comment is marked with this: (until the end of a Line)
244 * @param start_state: the Initial state on how to parse the String.
245 * @returns SPLIT_LINE_STATE the parser was in when returning
246 *
[7319]247 * This is the Actual Splitting Algorithm from Clemens Wacha
[7221]248 * Supports delimiters, escape characters,
249 * ignores special  characters between safemode_char and between comment_char and linend '\n'.
250 *
251 */
[7320]252SPLIT_LINE_STATE SubString::splitLine(std::vector<std::string>& ret,
253                                      const std::string& line,
254                                      const std::string& delimiters,
255                                      char escape_char,
256                                      char safemode_char,
257                                      char comment_char,
[7221]258                                      SPLIT_LINE_STATE start_state)
259{
260  SPLIT_LINE_STATE state = start_state;
[5183]261  unsigned int i = 0;
[7221]262  std::string token;
[5183]263
[7221]264  if(start_state != SL_NORMAL && ret.size() > 0)
[5656]265  {
[7221]266    token = ret[ret.size()-1];
267    ret.pop_back();
[5656]268  }
269
[7221]270  while(i < line.size())
[5656]271  {
[7221]272    switch(state)
[5656]273    {
[7319]274      case SL_NORMAL:
275        if(line[i] == escape_char)
[7221]276        {
[7319]277          state = SL_ESCAPE;
[7221]278        }
[7319]279        else if(line[i] == safemode_char)
[7221]280        {
[7319]281          state = SL_SAFEMODE;
[7221]282        }
[7319]283        else if(line[i] == comment_char)
284        {
285          /// FINISH
286          if(token.size() > 0)
287          {
288            ret.push_back(token);
289            token.clear();
290          }
291          token += line[i];       // EAT
292          state = SL_COMMENT;
293        }
294        else if(delimiters.find(line[i]) != std::string::npos)
295        {
296          // line[i] is a delimiter
297          /// FINISH
298          if(token.size() > 0)
299          {
300            ret.push_back(token);
301            token.clear();
302          }
303        }
304        else
305        {
306          token += line[i];       // EAT
307        }
308        break;
309      case SL_ESCAPE:
310        if(line[i] == 'n') token += '\n';
311        else if(line[i] == 't') token += '\t';
312        else if(line[i] == 'v') token += '\v';
313        else if(line[i] == 'b') token += '\b';
314        else if(line[i] == 'r') token += '\r';
315        else if(line[i] == 'f') token += '\f';
316        else if(line[i] == 'a') token += '\a';
317        else if(line[i] == '?') token += '\?';
318        else token += line[i];  // EAT
[7221]319        state = SL_NORMAL;
[7319]320        break;
321      case SL_SAFEMODE:
322        if(line[i] == safemode_char)
[7221]323        {
[7319]324          state = SL_NORMAL;
[7221]325        }
[7319]326        else if(line[i] == escape_char)
327        {
328          state = SL_SAFEESCAPE;
329        }
330        else
331        {
332          token += line[i];       // EAT
333        }
334        break;
335      case SL_SAFEESCAPE:
336        if(line[i] == 'n') token += '\n';
337        else if(line[i] == 't') token += '\t';
338        else if(line[i] == 'v') token += '\v';
339        else if(line[i] == 'b') token += '\b';
340        else if(line[i] == 'r') token += '\r';
341        else if(line[i] == 'f') token += '\f';
342        else if(line[i] == 'a') token += '\a';
343        else if(line[i] == '?') token += '\?';
344        else token += line[i];  // EAT
345        state = SL_SAFEMODE;
346        break;
347      case SL_COMMENT:
348        if(line[i] == '\n')
349        {
350          /// FINISH
351          if(token.size() > 0)
352          {
353            ret.push_back(token);
354            token.clear();
355          }
356          state = SL_NORMAL;
357        }
358        else
359        {
360          token += line[i];       // EAT
361        }
362        break;
363      default:
364        // nothing
365        break;
[5656]366    }
[7221]367    i++;
[5656]368  }
369
[7221]370  /// FINISH
371  if(token.size() > 0)
[5656]372  {
[7221]373    ret.push_back(token);
374    token.clear();
[5656]375  }
[7221]376  return(state);
[5656]377}
378
[3941]379
380/**
[7319]381 * @brief Some nice debug information about this SubString
[5200]382 */
[4833]383void SubString::debug() const
384{
[7221]385  printf("Substring-information::count=%d ::", this->strings.size());
386  for (unsigned int i = 0; i < this->strings.size(); i++)
387    printf("s%d='%s'::", i, this->strings[i].c_str());
388  printf("\n");
[4833]389}
Note: See TracBrowser for help on using the repository browser.