// ----------------------------------------------------------------------
// File: StringTokenizer.hh
// Author: Andreas-Joachim Peters - CERN
// ----------------------------------------------------------------------
/************************************************************************
* EOS - the CERN Disk Storage System *
* Copyright (C) 2011 CERN/Switzerland *
* *
* This program is free software: you can redistribute it and/or modify *
* it under the terms of the GNU General Public License as published by *
* the Free Software Foundation, either version 3 of the License, or *
* (at your option) any later version. *
* *
* This program is distributed in the hope that it will be useful, *
* but WITHOUT ANY WARRANTY; without even the implied warranty of *
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
* GNU General Public License for more details. *
* *
* You should have received a copy of the GNU General Public License *
* along with this program. If not, see .*
************************************************************************/
#pragma once
#include "common/Namespace.hh"
#include "XrdOuc/XrdOucString.hh"
#include
#include
#include
#include
#include
#include "common/StringSplit.hh"
EOSCOMMONNAMESPACE_BEGIN
//------------------------------------------------------------------------------
//! Utility class with convenience functions for string command line parsing.
//!
//! Works like XrdOucTokenizer but wants each argument in " ".
//! When returned, each token will have the enclosing quotes removed.
//!
//! Additional options:
//! - Replace & with #AND# in tokens
//! - Fully unescape quotes within the token
//------------------------------------------------------------------------------
class StringTokenizer
{
char* fBuffer;
int fCurrentLine;
int fCurrentArg;
std::vector fLineStart;
std::vector fLineArgs;
public:
//----------------------------------------------------------------------------
//! Constructor
//----------------------------------------------------------------------------
StringTokenizer(const char* s);
//----------------------------------------------------------------------------
//! Constructor
//----------------------------------------------------------------------------
StringTokenizer(XrdOucString s) : StringTokenizer(s.c_str()) {}
//----------------------------------------------------------------------------
//! Constructor
//----------------------------------------------------------------------------
StringTokenizer(std::string s) : StringTokenizer(s.c_str()) {}
//----------------------------------------------------------------------------
//! Destructor
//----------------------------------------------------------------------------
~StringTokenizer();
//----------------------------------------------------------------------------
//! Get next parsed line separated by \n
//!
//! @return next line
//----------------------------------------------------------------------------
const char* GetLine();
//----------------------------------------------------------------------------
//! Return next parsed space separated token taking into account escaped
//! blanks and quoted strings.
//!
//! Note: Quotes enclosing the token are removed, but other type of quotes
//! are left untouched
//!
//! @param escapeand if true escape & with #AND# !! UGLY!!
//!
//! @return next token or null if no token found
//----------------------------------------------------------------------------
const char* GetToken(bool escapeand = true);
//----------------------------------------------------------------------------
//! Return next parsed space separated token taking into account escaped
//! blanks and quoted strings.
//!
//! Note: Quotes enclosing the token are removed, while any other
//! type of quotes will be unescaped
//!
//! @param escapeand if true escape & with #AND#
//!
//! @return next token or null if no token found
//----------------------------------------------------------------------------
const char* GetTokenUnquoted(bool escapeand = true);
//----------------------------------------------------------------------------
//! Get next token and return it in the supplied StringType.
//!
//! Note: We use the StringType template to support both
//! std::string and XrdOucString.
//!
//! @param token the next token or empty string if nothing found
//! @param escapeand if true escape & with #AND#
//!
//! @return true if token retrieved, otherwise false
//----------------------------------------------------------------------------
template
bool NextToken(StringType& token, bool escapeand = true);
//----------------------------------------------------------------------------
//! Split given string based on the delimiter
//!
//! @param str given string
//! @param delimiter delimiter
//!
//! @return vector of tokens
//----------------------------------------------------------------------------
template
static C split(std::string_view str, const char delimiter);
//----------------------------------------------------------------------------
//! Merge vector's contents using the provided delimiter
//!
//! @param container container of tokens
//! @param delimiter delimiter
//!
//! @return string obtained from concatenating the tokens using the delimiter
//----------------------------------------------------------------------------
template
static std::string merge(const C& container, const char delimiter);
//----------------------------------------------------------------------------
//! Check if string represents unsigned number - could be dropped ?!
//----------------------------------------------------------------------------
static bool IsUnsignedNumber(const std::string& str);
};
//------------------------------------------------------------------------------
// Get next token and return it in the supplied StringType
//------------------------------------------------------------------------------
template
inline bool StringTokenizer::NextToken(StringType& token, bool escapeand)
{
const char* tmp = GetToken(escapeand);
if (tmp == nullptr) {
token = "";
return false;
}
token = tmp;
return true;
}
//------------------------------------------------------------------------------
// Split given string based on the delimiter
//------------------------------------------------------------------------------
template
C StringTokenizer::split(std::string_view str, char delimiter)
{
C container;
for (std::string_view part: CharSplitIt(str, delimiter)) {
container.emplace_back(part);
}
return container;
}
//------------------------------------------------------------------------------
// Merge container's contents using the provided delimiter
//------------------------------------------------------------------------------
template
std::string
StringTokenizer::merge(const C& container, char delimiter)
{
std::ostringstream oss;
for (const auto& elem : container) {
oss << elem << delimiter;
}
std::string output = oss.str();
if (output.length()) {
output.resize(output.length() - 1);
}
return output;
}
EOSCOMMONNAMESPACE_END