doc/v626/RooStreamParser_8cxx_source.html

/*****************************************************************************

 * Project: RooFit                                                           *

 * Package: RooFitCore                                                       *

 * @(#)root/roofitcore:$Id$

 * Authors:                                                                  *

 *   WV, Wouter Verkerke, UC Santa Barbara, verkerke@slac.stanford.edu       *

 *   DK, David Kirkby,    UC Irvine,         dkirkby@uci.edu                 *

 *                                                                           *

 * Copyright (c) 2000-2005, Regents of the University of California          *

 *                          and Stanford University. All rights reserved.    *

 *                                                                           *

 * Redistribution and use in source and binary forms,                        *

 * with or without modification, are permitted according to the terms        *

 * listed in LICENSE (http://roofit.sourceforge.net/license.txt)             *

 *****************************************************************************/


//////////////////////////////////////////////////////////////////////////////

//

// RooStreamParser is a utility class to parse istreams into tokens and optionally

// convert them into basic types (double,int,string)

//

// The general tokenizing philosophy is that there are two kinds of tokens: value

// and punctuation. The former are variable length, the latter always

// one character. A token is terminated if one of the following conditions

// occurs

//         - space character found (' ',tab,newline)

//         - change of token type (value -> punctuation or vv)

//         - end of fixed-length token (punctuation only)

//         - start or end of quoted string

//

// The parser is aware of floating point notation and will assign leading

// minus signs, decimal points etc to a value token when this is obvious

// from the context. The definition of what is punctuation can be redefined.

//


#include "RooFit.h"


#include "Riostream.h"

#include <errno.h>

#include <stdlib.h>


#ifndef _WIN32

#include <strings.h>

#endif


#include "RooStreamParser.h"

#include "RooMsgService.h"

#include "RooNumber.h"


using namespace std;


ClassImp(RooStreamParser);


////////////////////////////////////////////////////////////////////////////////

/// Construct parser on given input stream


RooStreamParser::RooStreamParser(istream& is) :
  RooStreamParser(is, TString(""))
{
  // Every member is initialised by the two-argument constructor; the empty
  // string passed on here leaves the error prefix empty.
}


////////////////////////////////////////////////////////////////////////////////

/// Construct parser on given input stream. Use given errorPrefix to

/// prefix any parsing error messages


RooStreamParser::RooStreamParser(istream& is, const TString& errorPrefix)
  : _is(&is),                                  // the stream is referenced, not copied
    _atEOL(kFALSE),
    _atEOF(kFALSE),
    _prefix(errorPrefix),                      // prepended to parse error messages
    _punct("()[]<>|/\\:?.,=+-&^%$#@!`~")      // initial set of punctuation characters
{
}


////////////////////////////////////////////////////////////////////////////////

/// Destructor


// Nothing is released here: the destructor body is empty.
RooStreamParser::~RooStreamParser() = default;


////////////////////////////////////////////////////////////////////////////////

/// If true, parser is at end of line in stream


Bool_t RooStreamParser::atEOL()
{
  // Look at the upcoming character without extracting it from the stream
  const Int_t upcoming = _is->peek() ;

  // A pending newline means the current line has been fully consumed
  if (upcoming == '\n') return kTRUE ;

  // The value -1 is treated here as the "no more input" result of peek()
  return upcoming == -1 ;
}


////////////////////////////////////////////////////////////////////////////////

/// Change list of characters interpreted as punctuation


void RooStreamParser::setPunctuation(const TString& punct)

{

  _punct = punct ;

}


////////////////////////////////////////////////////////////////////////////////

/// Check if given char is considered punctuation


Bool_t RooStreamParser::isPunctChar(char c) const
{
  // Walk the punctuation set from its first to its last character and
  // report a hit as soon as one of them equals c.
  const char* cursor = _punct.Data() ;
  const char* const stop = cursor + _punct.Length() ;

  while (cursor != stop) {
    if (*cursor++ == c) return kTRUE ;
  }

  // c does not occur in the punctuation set
  return kFALSE ;
}


////////////////////////////////////////////////////////////////////////////////

/// Read one token separated by any of the known punctuation characters.

/// This function recognizes and handles comment lines in the istream (those

/// starting with '#'), quoted strings ("") the content of which is not tokenized,

/// and '+-.' characters that are part of a floating point number and are exempt

/// from being interpreted as a token separator in case '+-.' are defined as

/// token separators.


TString RooStreamParser::readToken()

{

  // Smart tokenizer. Absorb white space and token must be either punctuation or alphanum

  // Characters are collected in a local buffer and returned as a TString.
  // An empty TString is returned when the stream is already at EOF or in a failed state.

  // State flags:
  //   first        - kTRUE until the first character has been stored in the buffer
  //   quotedString - kTRUE while reading a token that opened with a double quote
  //   lineCont     - set when a line continuation marker (two backslashes) is found

  Bool_t first(kTRUE), quotedString(kFALSE), lineCont(kFALSE) ;

  // c is the character just read, cnext a one-character lookahead and
  // cprev the character most recently stored in the buffer

  char buffer[64000], c(0), cnext = '\0', cprev = ' ';

  // haveINF records whether the lookahead after a sign character spells INF or inf

  Bool_t haveINF(kFALSE) ;

  // bufptr is the index of the next free slot in buffer

  Int_t bufptr(0) ;


  // Check for end of file

  if (_is->eof() || _is->fail()) {

    _atEOF = kTRUE ;

    return TString("") ;

  }


  //Ignore leading newline

  if (_is->peek()=='\n') {

    _is->get(c) ;


    // If new line starts with #, zap it

    // (repeated so that several consecutive '#' lines are all skipped)

    while (_is->peek()=='#') {

      zapToEnd(kFALSE) ;

      _is->get(c) ; // absorb newline

    }

  }


  while(1) {

    // Buffer overflow protection

    // (stopping at 63999 keeps one slot free for the terminating zero written after the loop)

    if (bufptr >= 63999) {

      oocoutW((TObject *)0, InputArguments)

              << "RooStreamParser::readToken: token length exceeds buffer capacity, terminating token early" << endl;

      break;

    }


    // Read next char

    _is->get(c) ;


    // Terminate at EOF, EOL or trouble

    if (_is->eof() || _is->fail() || c=='\n') break ;


    // Terminate as SPACE, unless we haven't seen any non-SPACE yet

    // (inside a quoted string the space falls through and is stored as part of the token)

    if (isspace(c)) {

      if (first)

        continue ;

      else

        if (!quotedString) {

          break ;

        }

    }


    // For '.', '-', '+', '/' and '\' look one character ahead; the lookahead is put back afterwards

    if (c == '.' || c=='-' || c=='+' || c=='/' || c=='\\') {

      _is->get(cnext) ;


      // When the lookahead is 'I' or 'i', inspect two further characters to
      // detect "INF" / "inf"; both are pushed back in reverse order of reading

      if (cnext=='I' || cnext=='i') {

        char tmp1,tmp2 ;

        _is->get(tmp1) ;

        _is->get(tmp2) ;

        _is->putback(tmp2) ;

        _is->putback(tmp1) ;

        haveINF = ((cnext=='I' && tmp1 == 'N' && tmp2 == 'F') || (cnext=='i' && tmp1 == 'n' && tmp2 == 'f')) ;

      } else {

        haveINF = kFALSE ;

      }


      _is->putback(cnext) ;

    }


    // Check for line continuation marker

    // (two consecutive backslash characters)

    if (c=='\\' && cnext=='\\') {

      // Kill rest of line including endline marker

      zapToEnd(kFALSE) ;

      _is->get(c) ;

      lineCont=kTRUE ;

      break ;

    }


    // Stop if begin of comments is encountered

    // (two consecutive forward slashes; the rest of the line is discarded)

    if (c=='/' && cnext=='/') {

      zapToEnd(kFALSE) ;

      break ;

    }


    // Special handling of quoted strings

    if (c=='"') {

      if (first) {

        // The token opens with a quote: switch to quoted-string mode

        quotedString=kTRUE ;

      } else if (!quotedString) {

        // Terminate current token. Next token will be quoted string

        _is->putback('"') ;

        break ;

      }

    }


    if (!quotedString) {

      // Decide if next char is punctuation (exempt - and . that are part of floating point numbers, or +/- preceding INF)

      // The three exemptions are:
      //   - a '.' with a digit directly before or after it
      //   - a sign that follows 'e' or 'E' and precedes a digit (exponent)
      //   - a sign at the start of a token that precedes a digit, a '.' or INF/inf

      if (isPunctChar(c) && !(c=='.' && (isdigit(cnext)||isdigit(cprev)))

          && !((c=='-'||c=='+') && isdigit(cnext) && (cprev == 'e' || cprev == 'E'))

          && (!first || !((c=='-'||c=='+') && (isdigit(cnext)||cnext=='.'||haveINF)))) {


        if (first) {

          // Make this a one-char punctuation token

          buffer[bufptr++]=c ;

          break ;

        } else {

          // Put back punct. char and terminate current alphanum token

          _is->putback(c) ;

          break ;

        }

      }

    } else {

      // Inside quoted string conventional tokenizing rules do not apply


      // Terminate token on closing quote

      // (the closing quote itself is stored, so the returned token keeps both quotes)

      if (c=='"' && !first) {

        buffer[bufptr++]=c ;

        quotedString=kFALSE ;

        break ;

      }

    }


    // Store in buffer

    buffer[bufptr++]=c ;

    first=kFALSE ;

    cprev=c ;

  }


  // Remember that the stream ran out (or went bad) while reading this token

  if (_is->eof() || _is->bad()) {

    _atEOF = kTRUE ;

  }


  // Check if closing quote was encountered

  // (quotedString is still set only if the loop ended before a closing quote was read)

  if (quotedString) {

    oocoutW((TObject*)0,InputArguments) << "RooStreamParser::readToken: closing quote (\") missing" << endl ;

  }


  // Absorb trailing white space or absorb rest of line if // is encountered

  if (c=='\n') {

    // Leave the newline in the stream, except after a line continuation

    if (!lineCont) {

      _is->putback(c) ;

    }

  } else {

    c = _is->peek() ;


    // Consume blanks up to, but not including, the next newline

    while ((isspace(c) || c=='/') && c != '\n') {

      if (c=='/') {

        // A second '/' starts a comment that is discarded; a single '/' is put back

        _is->get(c) ;

        if (_is->peek()=='/') {

          zapToEnd(kFALSE) ;

        } else {

          _is->putback('/') ;

        }

        break ;

      } else {

        _is->get(c) ;

        c = _is->peek() ;

      }

    }

  }


  // If no token was read line is continued, return first token on next line

  if (bufptr==0 && lineCont) {

    return readToken() ;

  }


  // Zero terminate buffer and convert to TString

  buffer[bufptr]=0 ;

  return TString(buffer) ;

}


////////////////////////////////////////////////////////////////////////////////

/// Read an entire line from the stream and return as TString

/// This method recognizes the use of '\\' in the istream

/// as line continuation token.


TString RooStreamParser::readLine()
{
   // Reads the next line of the stream into a fixed local buffer and returns it
   // with any trailing "//" comment and surrounding white space removed.
   // A line containing two consecutive backslashes is continued: the following
   // line is read on top of the marker. Sets _atEOF when the stream reports
   // eof or fail after reading.
   char c, buffer[64000];
   Int_t nfree(63999);

   // Guarantee a terminated string even if getline() below stores nothing
   buffer[0] = 0;

   // Skip a newline that is still pending from the previous read
   if (_is->peek() == '\n')
      _is->get(c);

   // Read till end of line
   _is->getline(buffer, nfree, '\n');

   // Look for eventual continuation line sequence; nfree shrinks by the number
   // of characters kept in front of each marker so reads stay inside buffer
   char *pcontseq = strstr(buffer, "\\\\");
   if (pcontseq)
      nfree -= (pcontseq - buffer);
   while (pcontseq) {
      // The continuation line overwrites the marker itself
      _is->getline(pcontseq, nfree, '\n');

      char *nextpcontseq = strstr(pcontseq, "\\\\");
      if (nextpcontseq)
         nfree -= (nextpcontseq - pcontseq);
      pcontseq = nextpcontseq;
   }

   // Chop eventual comments
   char *pcomment = strstr(buffer, "//");
   if (pcomment)
      *pcomment = 0;

   // Chop leading and trailing space. isspace() is only defined for values
   // representable as unsigned char (or EOF), so plain char is converted first.
   char *pstart = buffer;
   while (isspace(static_cast<unsigned char>(*pstart))) {
      pstart++;
   }
   char *pend = buffer + strlen(buffer) - 1;
   if (pend > pstart)
      while (isspace(static_cast<unsigned char>(*pend))) {
         *pend-- = 0;
      }

   if (_is->eof() || _is->fail()) {
      _atEOF = kTRUE;
   }

   // Convert to TString
   return TString(pstart);
}


////////////////////////////////////////////////////////////////////////////////

/// Eat all characters up to the end of the current line; the terminating

/// newline is put back into the stream. If inclContLines is kTRUE, all continuation lines

/// marked by the '\\' token are zapped as well


void RooStreamParser::zapToEnd(Bool_t inclContLines)
{
  // Nothing to discard when the stream is already positioned on a newline
  if (_is->peek() == '\n') return ;

  char scratch[64000] ;
  Int_t room = 63999 ;

  // Pull the remainder of the current line out of the stream
  _is->getline(scratch, room, '\n') ;

  if (inclContLines) {
    // Each time the text read so far contains a continuation marker (two
    // backslashes), read the following line on top of the marker. The space
    // handed to getline shrinks by the characters kept in front of the marker.
    char* segment = scratch ;
    char* marker = strstr(segment, "\\\\") ;
    while (marker) {
      room -= (marker - segment) ;
      _is->getline(marker, room, '\n') ;
      segment = marker ;
      marker = strstr(segment, "\\\\") ;
    }
  }

  // Put back newline character in stream buffer
  _is->putback('\n') ;
}


////////////////////////////////////////////////////////////////////////////////

/// Read the next token and return kTRUE if it differs from the given 'expected' token (i.e. kTRUE signals a parse error).


Bool_t RooStreamParser::expectToken(const TString& expected, Bool_t zapOnError)
{
  const TString got(readToken()) ;

  // Any non-zero comparison result counts as a mismatch
  const Bool_t mismatch = (got.CompareTo(expected) != 0) ;
  if (!mismatch) {
    return kFALSE ;
  }

  // Report only when an error prefix has been configured.
  // NOTE(review): the zap is also skipped when the prefix is empty - confirm this is intended.
  if (!_prefix.IsNull()) {
    oocoutW((TObject*)0,InputArguments) << _prefix << ": parse error, expected '"
                                        << expected << "'" << ", got '" << got << "'" << endl ;
    if (zapOnError) {
      zapToEnd(kTRUE) ;
    }
  }

  return kTRUE ;
}


////////////////////////////////////////////////////////////////////////////////

/// Read the next token and convert it to a Double_t. Returns true

/// if an error occurred in reading or conversion


Bool_t RooStreamParser::readDouble(Double_t& value, Bool_t /*zapOnError*/)
{
  const TString word = readToken() ;

  // An empty token is an error in itself; otherwise the outcome of the
  // conversion decides. The conversion is not attempted for an empty token.
  return word.IsNull() || convertToDouble(word, value) ;
}


////////////////////////////////////////////////////////////////////////////////

/// Convert given string to a double. Return true if the conversion fails.


Bool_t RooStreamParser::convertToDouble(const TString& token, Double_t& value)
{
  // Converts token to a Double_t stored in value.
  // Returns kFALSE on success and kTRUE on failure. Failure means that the
  // token is empty or that not all of its characters belong to the number.
  // A message is printed on failure if an error prefix has been set.
  char* endptr = 0;
  const char* data=token.Data() ;

  // Handle +/- infinity cases: "inf" on its own, or an explicit sign followed
  // by "inf" (case-insensitive). The sign test comes first so that data+1 is
  // only inspected when data[0] is a real character, never for an empty token.
  const Bool_t hasSign = (data[0]=='+' || data[0]=='-') ;
  if (!strcasecmp(data,"inf") || (hasSign && !strcasecmp(data+1,"inf"))) {
    value = (data[0]=='-') ? -RooNumber::infinity() : RooNumber::infinity() ;
    return kFALSE ;
  }

  value = strtod(data,&endptr) ;

  // endptr==data means strtod consumed nothing (e.g. an empty token); a length
  // mismatch means characters were left over after the number.
  Bool_t error = (endptr==data) || (endptr-data!=token.Length()) ;

  if (error && !_prefix.IsNull()) {
    oocoutE((TObject*)0,InputArguments) << _prefix << ": parse error, cannot convert '"
               << token << "'" << " to double precision" <<  endl ;
  }
  return error ;
}


////////////////////////////////////////////////////////////////////////////////

/// Read a token and convert it to an Int_t. Returns true

/// if an error occurred in reading or conversion


Bool_t RooStreamParser::readInteger(Int_t& value, Bool_t /*zapOnError*/)
{
  const TString word = readToken() ;

  // No token at all counts as an error; otherwise report what the
  // conversion reports. The conversion is skipped for an empty token.
  return word.IsNull() || convertToInteger(word, value) ;
}


////////////////////////////////////////////////////////////////////////////////

/// Convert given string to an Int_t. Returns true if an error

/// occurred in conversion


Bool_t RooStreamParser::convertToInteger(const TString& token, Int_t& value)
{
  // Converts token (base 10) to an Int_t stored in value.
  // Returns kFALSE on success and kTRUE on failure. Failure means that the
  // token is empty, that characters are left over after the number, or that
  // the number does not fit into an Int_t. A message is printed on failure if
  // an error prefix has been set.
  char* endptr = 0;
  const char* data=token.Data() ;

  // strtol reports overflow of long through errno, so clear it first
  errno = 0 ;
  const long parsed = strtol(data,&endptr,10) ;
  value = static_cast<Int_t>(parsed) ;

  // endptr==data means strtol consumed nothing (e.g. an empty token)
  const Bool_t nothingRead = (endptr==data) ;
  const Bool_t leftOver    = (endptr-data!=token.Length()) ;
  // The round trip through Int_t catches values that fit in long but not in Int_t
  const Bool_t outOfRange  = (errno==ERANGE) || (static_cast<long>(value)!=parsed) ;

  Bool_t error = nothingRead || leftOver || outOfRange ;

  if (error && !_prefix.IsNull()) {
    oocoutE((TObject*)0,InputArguments)<< _prefix << ": parse error, cannot convert '"
                   << token << "'" << " to integer" <<  endl ;
  }
  return error ;
}


////////////////////////////////////////////////////////////////////////////////

/// Read a string token. Returns true if an error occurred in reading

/// or conversion.  If the read token is enclosed in quotation

/// marks those are stripped in the returned value


Bool_t RooStreamParser::readString(TString& value, Bool_t /*zapOnError*/)
{
  const TString word = readToken() ;

  // An empty token is reported as an error without touching value;
  // otherwise the token is handed to convertToString().
  return word.IsNull() || convertToString(word, value) ;
}


////////////////////////////////////////////////////////////////////////////////

/// Convert given token to a string (i.e. remove eventual quotation marks)


Bool_t RooStreamParser::convertToString(const TString& token, TString& string)
{
   // Copies token into string, dropping one trailing and one leading double
   // quote if present. Always returns kFALSE (no error).
   //
   // The characters are taken straight from the token, so there is no
   // fixed-size intermediate buffer and no length limit.
   const char *begin = token.Data();
   Ssiz_t len = static_cast<Ssiz_t>(strlen(begin));

   // Remove trailing quote if any
   if (len > 0 && begin[len - 1] == '"')
      --len;

   // Skip leading quote, if present. The len check stops a lone '"' from
   // being counted as both the trailing and the leading quote.
   if (len > 0 && begin[0] == '"') {
      ++begin;
      --len;
   }

   // The temporary is built before the assignment, so passing the same
   // object as token and string is safe.
   string = TString(begin, len);
   return kFALSE;
}

c
#define c(i)
Definition RSha256.hxx:101

Riostream.h

RooFit.h

RooMsgService.h

oocoutW
#define oocoutW(o, a)
Definition RooMsgService.h:47

oocoutE
#define oocoutE(o, a)
Definition RooMsgService.h:48

RooNumber.h

RooStreamParser.h

kFALSE
const Bool_t kFALSE
Definition RtypesCore.h:101

kTRUE
const Bool_t kTRUE
Definition RtypesCore.h:100

ClassImp
#define ClassImp(name)
Definition Rtypes.h:364

Double_t

RooNumber::infinity
static Double_t infinity()
Return internal infinity representation.
Definition RooNumber.cxx:49

RooStreamParser
Definition RooStreamParser.h:21

RooStreamParser::isPunctChar
Bool_t isPunctChar(char c) const
Check if given char is considered punctuation.
Definition RooStreamParser.cxx:109

RooStreamParser::atEOL
Bool_t atEOL()
If true, parser is at end of line in stream.
Definition RooStreamParser.cxx:88

RooStreamParser::readInteger
Bool_t readInteger(Int_t &value, Bool_t zapOnError=kFALSE)
Read a token and convert it to an Int_t.
Definition RooStreamParser.cxx:456

RooStreamParser::readDouble
Bool_t readDouble(Double_t &value, Bool_t zapOnError=kFALSE)
Read the next token and convert it to a Double_t.
Definition RooStreamParser.cxx:416

RooStreamParser::convertToDouble
Bool_t convertToDouble(const TString &token, Double_t &value)
Convert given string to a double. Return true if the conversion fails.
Definition RooStreamParser.cxx:429

RooStreamParser::readString
Bool_t readString(TString &value, Bool_t zapOnError=kFALSE)
Read a string token.
Definition RooStreamParser.cxx:490

RooStreamParser::setPunctuation
void setPunctuation(const TString &punct)
Change list of characters interpreted as punctuation.
Definition RooStreamParser.cxx:99

RooStreamParser::zapToEnd
void zapToEnd(Bool_t inclContLines=kFALSE)
Eat all characters up to and including then end of the current line.
Definition RooStreamParser.cxx:361

RooStreamParser::expectToken
Bool_t expectToken(const TString &expected, Bool_t zapOnError=kFALSE)
Read the next token and return kTRUE if it is identical to the given 'expected' token.
Definition RooStreamParser.cxx:397

RooStreamParser::~RooStreamParser
virtual ~RooStreamParser()
Destructor.
Definition RooStreamParser.cxx:79

RooStreamParser::_punct
TString _punct
Definition RooStreamParser.h:55

RooStreamParser::_is
std::istream * _is
Definition RooStreamParser.h:51

RooStreamParser::convertToInteger
Bool_t convertToInteger(const TString &token, Int_t &value)
Convert given string to an Int_t.
Definition RooStreamParser.cxx:469

RooStreamParser::readLine
TString readLine()
Read an entire line from the stream and return as TString This method recognizes the use of '\' in th...
Definition RooStreamParser.cxx:309

RooStreamParser::readToken
TString readToken()
Read one token separated by any of the know punctuation characters This function recognizes and handl...
Definition RooStreamParser.cxx:129

RooStreamParser::_prefix
TString _prefix
Definition RooStreamParser.h:54

RooStreamParser::_atEOF
Bool_t _atEOF
Definition RooStreamParser.h:53

RooStreamParser::convertToString
Bool_t convertToString(const TString &token, TString &string)
Convert given token to a string (i.e. remove eventual quotation marks)
Definition RooStreamParser.cxx:502

RooStreamParser::RooStreamParser
RooStreamParser(std::istream &is)
Construct parser on given input stream.
Definition RooStreamParser.cxx:59

TObject
Mother of all ROOT objects.
Definition TObject.h:41

TString
Basic string class.
Definition TString.h:136

TString::Length
Ssiz_t Length() const
Definition TString.h:410

TString::CompareTo
int CompareTo(const char *cs, ECaseCompare cmp=kExact) const
Compare a string to char *cs2.
Definition TString.cxx:442

TString::Data
const char * Data() const
Definition TString.h:369

TString::IsNull
Bool_t IsNull() const
Definition TString.h:407

bool

int

first
Definition first.py:1