d3/db9/_string_parser_8cpp_source.html

/*

 * StringParser.cpp

 *

 *  Created on: Jan 6, 2012

 *      Author: Ben O'Leary (benjamin.oleary@gmail.com)

 *

 *      This file is part of BOLlib, released under the

 *      GNU General Public License. Please see the accompanying

 *      README.BOLlib.txt file for a full list of files, brief documentation

 *      on how to use these classes, and further details on the license.

 */


#include "StringParser.hpp"

#include <limits>


namespace BOL

{

  // definitions of the static constants of StringParser (their declarations
  // are in StringParser.hpp). the std::string constants are sets of
  // characters, suitable for passing to std::string::find_first_of and
  // std::string::find_first_not_of.

  // horizontal whitespace: space & tab.
  std::string const StringParser::whitespaceChars( " \t" );

  // line-ending characters: line feed & carriage return.
  std::string const StringParser::newlineChars( "\n\r" );

  // the union of whitespaceChars & newlineChars.
  std::string const StringParser::whitespaceAndNewlineChars( " \t\n\r" );

  // the 26 unaccented lowercase Latin letters.
  std::string const

  StringParser::lowercaseAlphabetChars( "abcdefghijklmnopqrstuvwxyz" );

  // the 26 unaccented uppercase Latin letters.
  std::string const

  StringParser::uppercaseAlphabetChars( "ABCDEFGHIJKLMNOPQRSTUVWXYZ" );

  // the 10 decimal digit characters.
  std::string const StringParser::digitChars( "0123456789" );


  // the offset which has to be added to an uppercase letter to get its
  // lowercase partner (32 in ASCII). stringsMatchIgnoringCase adds &
  // subtracts it to compare letters which differ only in case.
  char const StringParser::lowercaseMinusUppercase( 'a' - 'A' );


  std::string
  StringParser::intToString( int inputInt,
                             int const minimumNumberOfDigits,
                             std::string const prefixForPositiveNumbers,
                             std::string const prefixForNegativeNumbers,
                             char const paddingChar )
  /* this returns a std::string that is the ASCII version of inputInt in base
   * 10. the result is prefixForNegativeNumbers if inputInt is negative or
   * prefixForPositiveNumbers otherwise (so zero gets the positive prefix),
   * followed by enough copies of paddingChar to bring the number of
   * characters after the prefix up to at least minimumNumberOfDigits,
   * followed by the digits of the absolute value of inputInt
   * (e.g. intToString( 23, 4, "+", "-" ) returns "+0023"). a number with
   * more digits than minimumNumberOfDigits is never truncated.
   *
   * if minimumNumberOfDigits is not positive, a warning is written to
   * std::cout & "please_give_a_positive_number_of_digits" is returned.
   *
   * the absolute value is worked out as an unsigned int, because negating
   * the most negative int as an int overflows. this makes every int value
   * valid input.
   */
  {
    if( 0 >= minimumNumberOfDigits )
    {
      std::cout
      << std::endl
      << "BOL::warning! StringParser::intToString( "
      << inputInt << ", " << minimumNumberOfDigits << ", "
      << prefixForPositiveNumbers << ", " << prefixForNegativeNumbers
      << " ) could not fit the integer into the given size!";
      // report a warning message.
      return std::string( "please_give_a_positive_number_of_digits" );
    }
    bool const inputIsNegative( 0 > inputInt );
    // conversion to unsigned int is modular, so subtracting from zero gives
    // the absolute value even for the most negative int.
    unsigned int absoluteValue( static_cast< unsigned int >( inputInt ) );
    if( inputIsNegative )
    {
      absoluteValue = ( 0u - absoluteValue );
    }
    // the digits are peeled off least significant 1st, so each is inserted
    // at the front. the do-while ensures that zero still produces "0".
    std::string unpaddedIntAsString;
    do
    {
      unpaddedIntAsString.insert( unpaddedIntAsString.begin(),
                    static_cast< char >( '0' + ( absoluteValue % 10u ) ) );
      absoluteValue /= 10u;
    }
    while( 0u != absoluteValue );

    std::string returnString( inputIsNegative ? prefixForNegativeNumbers
                                              : prefixForPositiveNumbers );
    size_t const minimumSize( static_cast< size_t >( minimumNumberOfDigits ) );
    if( unpaddedIntAsString.size() < minimumSize )
    {
      returnString.append( ( minimumSize - unpaddedIntAsString.size() ),
                           paddingChar );
    }
    returnString.append( unpaddedIntAsString );
    return returnString;
  }


  std::string
  StringParser::doubleToString( double inputDouble,
                                int const numberOfMantissaDigits,
                                int const numberOfExponentDigits,
                                std::string const prefixForPositiveNumbers,
                                std::string const prefixForNegativeNumbers,
                                std::string const positiveExponentPrefix,
                                std::string const negativeExponentPrefix,
                                std::string const exponentCharacter )
  /* this returns a std::string that is the ASCII version of a double in base
   * 10, in the form specified thusly:
   * 1st: prefixForNegativeNumbers for negative numbers, or
   *      prefixForPositiveNumbers otherwise,
   * then the 1st digit,
   * then the decimal point,
   * then ( numberOfMantissaDigits - 1 ) digits following the decimal point
   * (so that the mantissa is numberOfMantissaDigits digits plus a decimal
   * point),
   * then exponentCharacter,
   * then positiveExponentPrefix or negativeExponentPrefix, depending on the
   * sign of the exponent,
   * then the absolute value of the exponent, with preceding 0s to fill to
   * at least numberOfExponentDigits digit characters.
   *
   * special cases:
   * - zero is written with an all-zero mantissa & exponent, with
   *   positiveExponentPrefix.
   * - infinities are returned as the sign prefix followed by "inf" (the
   *   normalization loops below could never terminate for them).
   * - NaNs are returned as UsefulStuff::nanString, without any prefix.
   * - if numberOfMantissaDigits or numberOfExponentDigits is not positive,
   *   a warning is written to std::cout &
   *   "please_give_a_positive_number_of_digits" is returned.
   *
   * the mantissa is scaled up to an int with numberOfMantissaDigits digits,
   * so 10 to the power of numberOfMantissaDigits has to fit in an int (at
   * most 9 digits for a 32-bit int).
   */
  {
    if( ( 0 >= numberOfMantissaDigits )
        ||
        ( 0 >= numberOfExponentDigits ) )
    {
      std::cout
      << std::endl
      << "BOL::warning! StringParser::doubleToString( "
      << inputDouble << ", " << numberOfMantissaDigits << ", "
      << numberOfExponentDigits << ", " << prefixForPositiveNumbers << ", "
      << prefixForNegativeNumbers << ", " << positiveExponentPrefix << ", "
      << negativeExponentPrefix << ", " << exponentCharacter
      << " ) could not fit the double into the given size!";
      // report a warning message.
      return std::string( "please_give_a_positive_number_of_digits" );
    }
    std::string returnString( prefixForPositiveNumbers );
    double formattedMantissa( inputDouble );
    if( 0.0 > inputDouble )
    {
      returnString.assign( prefixForNegativeNumbers );
      formattedMantissa = -inputDouble;
    }
    // from here on formattedMantissa is either non-negative or a NaN.
    if( std::numeric_limits< double >::infinity() == formattedMantissa )
      // infinity times 0.1 is still infinity, so it has to be caught before
      // the loop which divides the mantissa down into range.
    {
      returnString.append( "inf" );
    }
    else if( 0.0 == formattedMantissa )
    {
      returnString.append( "0." );
      returnString.append(
                        static_cast< size_t >( numberOfMantissaDigits - 1 ),
                           '0' );
      returnString.append( exponentCharacter );
      returnString.append( positiveExponentPrefix );
      returnString.append( static_cast< size_t >( numberOfExponentDigits ),
                           '0' );
    }
    else if( 0.0 < formattedMantissa )
      // at this point any negative numbers will now be positive, so any
      // that fail this comparison should be NaN.
    {
      // 10^( numberOfMantissaDigits - 1 ), the smallest int with the
      // requested number of digits:
      int tenToDigitsMinusOneAsInt( 1 );
      for( int mantissaDigitCount( 1 );
           numberOfMantissaDigits > mantissaDigitCount;
           ++mantissaDigitCount )
      {
        tenToDigitsMinusOneAsInt *= 10;
      }
      double const tenToDigitsMinusOneAsDouble(
                         static_cast< double >( tenToDigitsMinusOneAsInt ) );
      double const tenToDigits( 10.0 * tenToDigitsMinusOneAsDouble );
      int formattedExponent( 0 );
      // scale the mantissa into [ 10^( digits - 1 ), 10^digits ), keeping
      // track of the powers of 10 in formattedExponent:
      while( tenToDigits <= formattedMantissa )
      {
        formattedMantissa *= 0.1;
        ++formattedExponent;
      }
      while( tenToDigitsMinusOneAsDouble > formattedMantissa )
      {
        formattedMantissa *= 10.0;
        --formattedExponent;
      }
      /* now formattedMantissa is between tenToDigitsMinusOneAsDouble &
       * tenToDigits, & hence has numberOfMantissaDigits digits before the
       * decimal point. however, now we have to round correctly (halves are
       * rounded up):
       */
      int mantissaTimesTenToSomePowerAsInt(
                                    static_cast< int >( formattedMantissa ) );
      if( 0.5 <= ( formattedMantissa
                 - static_cast< double >( mantissaTimesTenToSomePowerAsInt ) ) )
      {
        ++mantissaTimesTenToSomePowerAsInt;
      }
      if( mantissaTimesTenToSomePowerAsInt
          >= ( 10 * tenToDigitsMinusOneAsInt ) )
        // if rounding pushed mantissaTimesTenToSomePowerAsInt into having too
        // many digits...
      {
        mantissaTimesTenToSomePowerAsInt
        = ( mantissaTimesTenToSomePowerAsInt / 10 );
        ++formattedExponent;
      }
      std::string const mantissaTimesTenToSomePowerAsString(
                   positiveIntToString( mantissaTimesTenToSomePowerAsInt ) );
      // the 1st digit goes before the decimal point, the rest go after it:
      returnString.append( 1,
                           mantissaTimesTenToSomePowerAsString[ 0 ] );
      returnString.append( 1,
                           '.' );
      returnString.append( mantissaTimesTenToSomePowerAsString,
                           1,
                          ( mantissaTimesTenToSomePowerAsString.size() - 1 ) );
      formattedExponent += ( numberOfMantissaDigits - 1 );
      // this accounts for all the multiplication to get the mantissa as an
      // int of the appropriate length.
      returnString.append( exponentCharacter );
      if( 0 > formattedExponent )
      {
        returnString.append( negativeExponentPrefix );
        formattedExponent = -formattedExponent;
      }
      else
      {
        returnString.append( positiveExponentPrefix );
      }
      std::string const
      exponentIntAsString( positiveIntToString( formattedExponent ) );
      int const exponentZeroesToPrepend( numberOfExponentDigits
                        - static_cast< int >( exponentIntAsString.size() ) );
      if( 0 < exponentZeroesToPrepend )
      {
        returnString.append( static_cast< size_t >( exponentZeroesToPrepend ),
                             '0' );
      }
      returnString.append( exponentIntAsString );
    }
    else
      // if it failed every comparison, it should be a NaN.
    {
      returnString.assign( UsefulStuff::nanString );
    }
    return returnString;
  }


  bool
  StringParser::stringsMatchIgnoringCase( std::string const& firstString,
                                          std::string const& secondString )
  // this returns true if the 2 strings have the same length & every pair of
  // chars at the same position is either identical or is the same letter
  // from 'a' to 'z' / 'A' to 'Z' in different cases.
  {
    size_t const commonLength( firstString.size() );
    if( secondString.size() != commonLength )
      // strings of different lengths cannot match.
    {
      return false;
    }
    for( size_t charPosition( 0 );
         commonLength > charPosition;
         ++charPosition )
    {
      char const firstChar( firstString[ charPosition ] );
      char const secondChar( secondString[ charPosition ] );
      if( firstChar == secondChar )
      {
        continue;
      }
      // the chars differ, so they only match if firstChar is a letter &
      // secondChar is the same letter in the other case:
      bool const firstIsUppercase( ( 'A' <= firstChar )
                                   &&
                                   ( 'Z' >= firstChar ) );
      if( firstIsUppercase
          &&
          ( ( firstChar + lowercaseMinusUppercase ) == secondChar ) )
      {
        continue;
      }
      bool const firstIsLowercase( ( 'a' <= firstChar )
                                   &&
                                   ( 'z' >= firstChar ) );
      if( firstIsLowercase
          &&
          ( ( firstChar - lowercaseMinusUppercase ) == secondChar ) )
      {
        continue;
      }
      return false;
    }
    // no mismatch was found at any position.
    return true;
  }


  bool
  StringParser::stringIsDouble( std::string const& stringToInterpret,
                                double& doubleToSet )
  /* this returns true if stringToInterpret is a floating-point number in
   * decimal or scientific E notation (allowing 'E' or 'e'), and sets
   * doubleToSet to stringToDouble( stringToInterpret ) if so. doubleToSet is
   * left untouched if false is returned.
   *
   * the accepted form is, in order:
   * - optional leading characters from whitespaceAndNewlineChars,
   * - an optional '+' or '-',
   * - digits, optionally with a single '.' before, between or after them,
   *   with at least 1 digit in total,
   * - optionally 'e' or 'E', then an optional '+' or '-', then at least 1
   *   digit,
   * - optional trailing characters from whitespaceAndNewlineChars.
   *
   * requiring at least 1 digit in the mantissa & in any exponent means that
   * strings such as ".", "+ " or "e" are rejected, while exponents with a
   * single digit & no sign, such as in "1e5", are accepted.
   */
  {
    size_t const stringSize( stringToInterpret.size() );
    size_t charPosition( stringToInterpret.find_first_not_of(
                                                 whitespaceAndNewlineChars ) );
    if( std::string::npos == charPosition )
      // the string is empty or only whitespace.
    {
      return false;
    }
    if( ( '+' == stringToInterpret[ charPosition ] )
        ||
        ( '-' == stringToInterpret[ charPosition ] ) )
    {
      ++charPosition;
    }

    // the digits before any decimal point. find_first_not_of returns npos
    // if the digits run to the end of the string (or if the search starts
    // at the end), in which case the position is pinned to stringSize.
    size_t const integerPartStart( charPosition );
    charPosition = stringToInterpret.find_first_not_of( digitChars,
                                                        charPosition );
    if( std::string::npos == charPosition )
    {
      charPosition = stringSize;
    }
    size_t numberOfMantissaDigits( charPosition - integerPartStart );

    // the optional decimal point & the digits after it:
    if( ( stringSize > charPosition )
        &&
        ( '.' == stringToInterpret[ charPosition ] ) )
    {
      size_t const fractionalPartStart( charPosition + 1 );
      charPosition = stringToInterpret.find_first_not_of( digitChars,
                                                        fractionalPartStart );
      if( std::string::npos == charPosition )
      {
        charPosition = stringSize;
      }
      numberOfMantissaDigits += ( charPosition - fractionalPartStart );
    }
    if( 0 == numberOfMantissaDigits )
    {
      return false;
    }

    // the optional exponent:
    if( ( stringSize > charPosition )
        &&
        ( ( 'e' == stringToInterpret[ charPosition ] )
          ||
          ( 'E' == stringToInterpret[ charPosition ] ) ) )
    {
      ++charPosition;
      if( ( stringSize > charPosition )
          &&
          ( ( '+' == stringToInterpret[ charPosition ] )
            ||
            ( '-' == stringToInterpret[ charPosition ] ) ) )
      {
        ++charPosition;
      }
      size_t const exponentDigitsStart( charPosition );
      charPosition = stringToInterpret.find_first_not_of( digitChars,
                                                          charPosition );
      if( std::string::npos == charPosition )
      {
        charPosition = stringSize;
      }
      if( exponentDigitsStart == charPosition )
        // an exponent character without any exponent digits is not valid.
      {
        return false;
      }
    }

    // only whitespace is allowed after the number:
    if( std::string::npos
        != stringToInterpret.find_first_not_of( whitespaceAndNewlineChars,
                                                charPosition ) )
    {
      return false;
    }
    doubleToSet = stringToDouble( stringToInterpret );
    return true;
  }


  std::vector< int >
  StringParser::stringToIntVector( std::string stringToInterpret )
  /* this parses stringToInterpret as a list of numbers separated by
   * whitespace, commas or semicolons, & returns them converted to ints in
   * the order in which they appear. each number is read as a double & then
   * converted to an int, which discards any fractional part.
   *
   * parsing stops at the 1st thing which cannot be read as a number:
   * everything read successfully before it is returned & nothing is
   * appended for the failed read. an empty or blank string gives an empty
   * vector.
   */
  {
    // commas & semicolons are turned into spaces so that the stream
    // extraction treats them as separators.
    substituteCharacterWith( stringToInterpret,
                             ',',
                             ' ' );
    substituteCharacterWith( stringToInterpret,
                             ';',
                             ' ' );
    std::vector< int > returnVector;
    std::stringstream streamToParse( trimFromFrontAndBack( stringToInterpret,
                                                 whitespaceAndNewlineChars ) );
    double parsedIntAsDouble( 0.0 );
    // the extraction itself is the loop condition, so a value is only
    // appended if it was actually read.
    while( streamToParse >> parsedIntAsDouble )
    {
      returnVector.push_back( static_cast< int >( parsedIntAsDouble ) );
    }
    return returnVector;
  }


  std::string
  StringParser::substringToFirst( std::string const& stringToParse,
                   VectorlikeArray< std::string > const& delimitersOfSubstring,
                                  std::string* const remainderString )
  /* this looks for the earliest position in stringToParse at which any of
   * the strings in delimitersOfSubstring starts.
   * - if none of them is found, the whole of stringToParse is returned &
   *   remainderString (if it is not NULL) is set to the empty string.
   * - otherwise, the part of stringToParse before that position is returned
   *   & remainderString (if it is not NULL) is set to the rest of
   *   stringToParse, which therefore begins with the delimiter itself.
   * element 0 of delimitersOfSubstring is always read.
   * NOTE(review): this presumably requires delimitersOfSubstring to be
   * non-empty - confirm against VectorlikeArray.
   */
  {
    // the search starts from element 0, then every other element gets the
    // chance to lower the position. std::string::npos is the largest
    // size_t, so any found position counts as earlier than "not found".
    size_t earliestPosition( stringToParse.find(
                                              delimitersOfSubstring[ 0 ] ) );
    int const lastDelimiterIndex( delimitersOfSubstring.getLastIndex() );
    for( int delimiterIndex( 1 );
         lastDelimiterIndex >= delimiterIndex;
         ++delimiterIndex )
    {
      size_t const candidatePosition( stringToParse.find(
                                 delimitersOfSubstring[ delimiterIndex ] ) );
      if( earliestPosition > candidatePosition )
      {
        earliestPosition = candidatePosition;
      }
    }

    bool const remainderIsWanted( NULL != remainderString );
    if( std::string::npos == earliestPosition )
      // none of the delimiters is in stringToParse.
    {
      if( remainderIsWanted )
      {
        remainderString->assign( "" );
      }
      return stringToParse;
    }

    // the returned part is copied out before the remainder is written.
    std::string partBeforeDelimiter( stringToParse.substr( 0,
                                                        earliestPosition ) );
    if( remainderIsWanted )
    {
      remainderString->assign( stringToParse.substr( earliestPosition ) );
    }
    return partBeforeDelimiter;
  }


  std::string
  StringParser::firstWordOf( std::string const& stringToParse,
                             std::string* const remainderString,
                             std::string const& separatorChars )
  /* this returns the 1st "word" of stringToParse: the longest run of chars
   * which are not in separatorChars, starting from the 1st such char. if
   * there is no such char, the empty string is returned.
   * if remainderString is not NULL, it is set to what follows the word,
   * starting from the next char which is not in separatorChars (so the
   * separators directly after the word are dropped), or to the empty string
   * if there is nothing but separators after the word or if there was no
   * word at all.
   */
  {
    bool const remainderIsWanted( NULL != remainderString );
    size_t const startOfWord(
                       stringToParse.find_first_not_of( separatorChars ) );
    if( std::string::npos == startOfWord )
      // there is nothing but separators (or nothing at all).
    {
      if( remainderIsWanted )
      {
        remainderString->clear();
      }
      return std::string();
    }

    // if no separator follows the word, endOfWord is npos, & the length
    // given below is then large enough to take everything up to the end of
    // stringToParse.
    size_t const endOfWord( stringToParse.find_first_of( separatorChars,
                                                         startOfWord ) );
    std::string foundWord( stringToParse,
                           startOfWord,
                           ( endOfWord - startOfWord ) );
    if( remainderIsWanted )
    {
      // searching from npos just gives npos again, so a word which ran to
      // the end of the string leaves an empty remainder.
      size_t const startOfRemainder(
                        stringToParse.find_first_not_of( separatorChars,
                                                         endOfWord ) );
      if( std::string::npos == startOfRemainder )
      {
        remainderString->clear();
      }
      else
      {
        remainderString->assign( stringToParse.substr( startOfRemainder ) );
      }
    }
    return foundWord;
  }


  // this constructor stores the formatting settings for an instance: each
  // argument is copied into the data member of the same name & nothing else
  // is done. the default values of the arguments are given with the
  // declaration in StringParser.hpp.
  StringParser::StringParser( int const minimumNumberOfDigitsForInts,

                              char const paddingCharForInts,

                              int const numberOfMantissaDigits,

                              int const numberOfExponentDigits,

                              std::string const prefixForPositiveNumbers,

                              std::string const prefixForNegativeNumbers,

                              std::string const positiveExponentPrefix,

                              std::string const negativeExponentPrefix,

                              std::string const exponentCharacter ) :

      // in each initializer, the name outside the brackets is the data
      // member & the name inside the brackets is the constructor argument.
      minimumNumberOfDigitsForInts( minimumNumberOfDigitsForInts ),

      paddingCharForInts( paddingCharForInts ),

      numberOfMantissaDigits( numberOfMantissaDigits ),

      numberOfExponentDigits( numberOfExponentDigits ),

      prefixForPositiveNumbers( prefixForPositiveNumbers ),

      prefixForNegativeNumbers( prefixForNegativeNumbers ),

      positiveExponentPrefix( positiveExponentPrefix ),

      negativeExponentPrefix( negativeExponentPrefix ),

      exponentCharacter( exponentCharacter )

  {

    // just an initialization list: there is nothing left to do in the body.

  }


  // the destructor has an empty body: nothing is released explicitly here.
  StringParser::~StringParser()

  {

    // does nothing.

  }


  char
  StringParser::charForSingleDigit( int const singleDigitAsInt )
  // this returns the char from '0' to '9' for an int from 0 to 9, or '?' for
  // any int outside that range.
  {
    bool const isSingleDigit( ( 0 <= singleDigitAsInt )
                              &&
                              ( 9 >= singleDigitAsInt ) );
    // the chars '0' to '9' are consecutive, so the digit can just be added
    // to '0'.
    return ( isSingleDigit ? static_cast< char >( '0' + singleDigitAsInt )
                           : '?' );
  }


  int
  StringParser::intForSingleDigit( char const singleDigitAsChar )
  /* this returns the value of a single hexadecimal digit char: 0 to 9 for
   * '0' to '9', & 10 to 15 for uppercase 'A' to 'F'. lowercase 'a' to 'f'
   * are not recognized. for any other char, the result of converting
   * UsefulStuff::notANumber to an int is returned.
   * NOTE(review): if UsefulStuff::notANumber is a NaN, that conversion is
   * not well-defined, so callers should not rely on its value - confirm.
   */
  {
    if( ( '0' <= singleDigitAsChar )
        &&
        ( '9' >= singleDigitAsChar ) )
    {
      return ( singleDigitAsChar - '0' );
    }
    if( ( 'A' <= singleDigitAsChar )
        &&
        ( 'F' >= singleDigitAsChar ) )
    {
      return ( 10 + ( singleDigitAsChar - 'A' ) );
    }
    // anything else is not a digit which is known here.
    return (int)(UsefulStuff::notANumber);
  }


  std::string
  StringParser::positiveIntToString( int positiveInt )
  /* this returns the digits of positiveInt in base 10, with the digit for
   * the highest power of 10 1st, without any sign or padding. zero gives
   * "0", & so does any negative number.
   *
   * the digits are taken off with % 10 & / 10 rather than by comparing
   * against a growing power of 10, because the 1st power of 10 above a
   * large int (1000000000 or more for a 32-bit int) does not fit in an int.
   */
  {
    if( 0 >= positiveInt )
    {
      return std::string( "0" );
    }
    std::string digitBuffer;
    while( 0 < positiveInt )
    {
      // the least significant digit comes off 1st, so each new digit goes
      // in front of those already found.
      digitBuffer.insert( digitBuffer.begin(),
                          charForSingleDigit( positiveInt % 10 ) );
      positiveInt /= 10;
    }
    return digitBuffer;
  }


}

StringParser.hpp

BOL::StringParser::prefixForPositiveNumbers
std::string prefixForPositiveNumbers
Definition: StringParser.hpp:277

BOL::StringParser::StringParser
StringParser(int const minimumNumberOfDigitsForInts=6, char const paddingCharForInts='0', int const numberOfMantissaDigits=6, int const numberOfExponentDigits=2, std::string const prefixForPositiveNumbers="+", std::string const prefixForNegativeNumbers="-", std::string const positiveExponentPrefix="+", std::string const negativeExponentPrefix="-", std::string const exponentCharacter="E")
Definition: StringParser.cpp:441

BOL::StringParser::firstWordOf
static std::string firstWordOf(std::string const &stringToParse, std::string *const remainderString=NULL, std::string const &separatorChars=whitespaceChars)
Definition: StringParser.cpp:400

BOL::StringParser::uppercaseAlphabetChars
static std::string const uppercaseAlphabetChars
Definition: StringParser.hpp:39

BOL::StringParser::lowercaseAlphabetChars
static std::string const lowercaseAlphabetChars
Definition: StringParser.hpp:38

BOL::StringParser::positiveExponentPrefix
std::string positiveExponentPrefix
Definition: StringParser.hpp:279

BOL::StringParser::whitespaceAndNewlineChars
static std::string const whitespaceAndNewlineChars
Definition: StringParser.hpp:37

BOL::StringParser::stringsMatchIgnoringCase
static bool stringsMatchIgnoringCase(std::string const &firstString, std::string const &secondString)
Definition: StringParser.cpp:220

BOL::StringParser::stringToIntVector
static std::vector< int > stringToIntVector(std::string stringToInterpret)
Definition: StringParser.cpp:323

BOL::StringParser::digitChars
static std::string const digitChars
Definition: StringParser.hpp:40

BOL::StringParser::intForSingleDigit
static int intForSingleDigit(char const singleDigitAsChar)
Definition: StringParser.cpp:500

BOL::StringParser::negativeExponentPrefix
std::string negativeExponentPrefix
Definition: StringParser.hpp:280

BOL::StringParser::whitespaceChars
static std::string const whitespaceChars
Definition: StringParser.hpp:35

BOL::StringParser::numberOfMantissaDigits
int numberOfMantissaDigits
Definition: StringParser.hpp:275

BOL::StringParser::stringIsDouble
static bool stringIsDouble(std::string const &stringToInterpret, double &doubleToSet)
Definition: StringParser.cpp:263

BOL::StringParser::newlineChars
static std::string const newlineChars
Definition: StringParser.hpp:36

BOL::StringParser::trimFromFrontAndBack
static std::string trimFromFrontAndBack(std::string const &stringToTrim, std::string const &charsToTrim=whitespaceAndNewlineChars)
Definition: StringParser.hpp:502

BOL::StringParser::stringToDouble
static double stringToDouble(std::string const &stringToInterpret)
Definition: StringParser.hpp:422

BOL::StringParser::intToString
static std::string intToString(int inputInt, int const minimumNumberOfDigits, std::string const prefixForPositiveNumbers="+", std::string const prefixForNegativeNumbers="-", char const paddingChar='0')
Definition: StringParser.cpp:30

BOL::StringParser::lowercaseMinusUppercase
static char const lowercaseMinusUppercase
Definition: StringParser.hpp:258

BOL::StringParser::~StringParser
~StringParser()
Definition: StringParser.cpp:463

BOL::StringParser::charForSingleDigit
static char charForSingleDigit(int const singleDigitAsInt)
Definition: StringParser.cpp:470

BOL::StringParser::prefixForNegativeNumbers
std::string prefixForNegativeNumbers
Definition: StringParser.hpp:278

BOL::StringParser::positiveIntToString
static std::string positiveIntToString(int positiveInt)
Definition: StringParser.cpp:542

BOL::StringParser::numberOfExponentDigits
int numberOfExponentDigits
Definition: StringParser.hpp:276

BOL::StringParser::exponentCharacter
std::string exponentCharacter
Definition: StringParser.hpp:281

BOL::StringParser::doubleToString
static std::string doubleToString(double inputDouble, int const numberOfMantissaDigits, int const numberOfExponentDigits, std::string const prefixForPositiveNumbers="+", std::string const prefixForNegativeNumbers="-", std::string const positiveExponentPrefix="+", std::string const negativeExponentPrefix="-", std::string const exponentCharacter="E")
Definition: StringParser.cpp:78

BOL::StringParser::substituteCharacterWith
static void substituteCharacterWith(std::string &stringToTransform, char const charToBeReplaced, char const charToBePutIn)
Definition: StringParser.hpp:373

BOL::StringParser::substringToFirst
static std::string substringToFirst(std::string const &stringToParse, VectorlikeArray< std::string > const &delimitersOfSubstring, std::string *const remainderString=NULL)
Definition: StringParser.cpp:348

BOL::UsefulStuff::notANumber
static double const notANumber
Definition: UsefulStuff.hpp:28

BOL::UsefulStuff::nanString
static std::string const nanString
Definition: UsefulStuff.hpp:29

BOL::VectorlikeArray
Definition: VectorlikeArray.hpp:31

BOL::VectorlikeArray::getLastIndex
int getLastIndex() const
Definition: VectorlikeArray.hpp:289

BOL
Definition: ArgumentParser.hpp:23