/* * Copyright (c) 2015, Intel Corporation * All rights reserved. * * Redistribution and use in source and binary forms, with or without modification, * are permitted provided that the following conditions are met: * * 1. Redistributions of source code must retain the above copyright notice, this * list of conditions and the following disclaimer. * * 2. Redistributions in binary form must reproduce the above copyright notice, * this list of conditions and the following disclaimer in the documentation and/or * other materials provided with the distribution. * * 3. Neither the name of the copyright holder nor the names of its contributors * may be used to endorse or promote products derived from this software without * specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include "Tokenizer.h" using std::string; using std::vector; const string Tokenizer::defaultDelimiters = " \n\r\t\v\f"; Tokenizer::Tokenizer(const string &input, const string &delimiters, bool mergeDelimiters) : _input(input), _delimiters(delimiters), _mergeDelimiters(mergeDelimiters) { } vector Tokenizer::split() { vector result; string token; bool leftover = false; for (const auto character : _input) { if (_delimiters.find(character) != string::npos) { if (_mergeDelimiters) { leftover = false; if (token.empty()) { // skip consecutive delimiters continue; } } else { // We've encountered a delimiter, which means that there is a // left-hand token and a right-side token. We are going to add // the left-hand one but must not forget that there is a // right-hand one (possibly empty) leftover = true; } result.push_back(token); token.clear(); continue; } token += character; leftover = true; } // push any leftover token: if (leftover) { result.push_back(token); } return result; }