libdap4/html/parser-util_8cc_source.html

// -*- mode: c++; c-basic-offset:4 -*-


// This file is part of libdap, A C++ implementation of the OPeNDAP Data

// Access Protocol.


// Copyright (c) 2002,2003 OPeNDAP, Inc.

// Author: James Gallagher <jgallagher@opendap.org>

//

// This library is free software; you can redistribute it and/or

// modify it under the terms of the GNU Lesser General Public

// License as published by the Free Software Foundation; either

// version 2.1 of the License, or (at your option) any later version.

//

// This library is distributed in the hope that it will be useful,

// but WITHOUT ANY WARRANTY; without even the implied warranty of

// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

// Lesser General Public License for more details.

//

// You should have received a copy of the GNU Lesser General Public

// License along with this library; if not, write to the Free Software

// Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA

//

// You can contact OPeNDAP, Inc. at PO Box 112, Saunderstown, RI. 02874-0112.


// (c) COPYRIGHT URI/MIT 1995-1999

// Please read the full copyright statement in the file COPYRIGHT_URI.

//

// Authors:

//      jhrg,jimg       James Gallagher <jgallagher@gso.uri.edu>


// These functions are utility functions used by the various DAP parsers (the

// DAS, DDS and constraint expression parsers).

// jhrg 9/7/95


#include "config.h"


#include <cassert>

#include <cerrno>

#include <cmath>

#include <cstdlib>

#include <cstring>


#include <iostream>

#include <sstream>


//  We wrap VC++ 6.x strtod() to account for a shortcoming

//  in that function with regard to "NaN".

#ifdef WIN32

#include <limits>

double w32strtod(const char *, char **);

#endif


#include "Error.h"

#include "debug.h"

#include "dods-limits.h"

#include "parser.h" // defines constants such as ID_MAX

#include "util.h"   // Jose Garcia: for append_long_to_string.


using std::cerr;

using std::endl;


#ifdef WIN32

//  VC++ 6.x strtod() doesn't recognize "NaN".  Account for it

//  by wrapping it around a check for the Nan string.  Use of

//  the product is obsolete as of 1/2007, but it is unknown if

//  the issue is still there in later releases of that product.

//  ROM - 01/2007

/**
 * @brief strtod() wrapper that also accepts the text "NaN" in any letter case.
 *
 * If @p val is not (case-insensitively) equal to "NaN", the call is forwarded
 * to strtod() unchanged. Otherwise a quiet NaN is returned and @p ptr is
 * pointed at the terminating NUL of @p val, i.e. the whole string is reported
 * as consumed.
 *
 * @param val NUL-terminated text to convert.
 * @param ptr Receives the address of the first character that was not parsed.
 * @return The converted value, or a quiet NaN for the "NaN" spelling.
 */
double w32strtod(const char *val, char **ptr) {
    // Compare the C strings directly. No temporary std::string objects are
    // needed, so nothing is allocated (and nothing can leak) on this path.
    if (stricmp(val, "NaN") != 0)
        return strtod(val, ptr);

    // It is the NaN spelling: report the whole string as parsed and return
    // the NaN bit pattern.
    *ptr = const_cast<char *>(val) + strlen(val);
    return std::numeric_limits<double>::quiet_NaN();
}

#endif


namespace libdap {


// Deprecated, but still used by the HDF4 EOS server code.


/**
 * @brief Record a parse failure in a parser_arg object.
 *
 * Sets the status of @p arg to FALSE and stores a newly allocated Error
 * (code unknown_error) in it. The error text starts with either the line
 * number or a generic "Parse error." notice, optionally followed by the
 * context, and ends with @p msg on a line of its own.
 *
 * @param arg      Parser argument that receives the status and the Error.
 * @param msg      Description of the problem; must not be null.
 * @param line_num Line where the problem was seen; 0 means "unknown".
 * @param context  Text near the problem, or null when there is none.
 */
void parse_error(parser_arg *arg, const char *msg, const int line_num, const char *context) {
    // Development-time sanity checks; they vanish when NDEBUG is defined.
    assert(arg);
    assert(msg);

    arg->set_status(FALSE);

    // Header: the line number when it is known, a generic notice otherwise.
    string text;
    if (line_num == 0) {
        text += "Parse error.";
    } else {
        text += "Error parsing the text on line ";
        append_long_to_string(line_num, 10, text);
    }

    // Optional context, then the caller's message on its own line.
    if (context) {
        text += " at or near: ";
        text += context;
    }
    text += "\n";
    text += msg;
    text += "\n";

    arg->set_error(new Error(unknown_error, text));
}


void parse_error(const char *msg, const int line_num, const char *context) {

    // Jose Garcia

    // This assert(s) is (are) only for developing purposes

    // For production servers remove it by compiling with NDEBUG

    assert(msg);


    string oss = "";


    if (line_num != 0) {

        oss += "Error parsing the text on line ";

        append_long_to_string(line_num, 10, oss);

    } else {

        oss += "Parse error.";

    }


    if (context)

        oss += (string) " at or near: " + context + (string) "\n" + msg + (string) "\n";

    else

        oss += (string) "\n" + msg + (string) "\n";


    throw Error(malformed_expr, oss);

}


// context comes from the parser and will always be a char * unless the

// parsers change dramatically.


void parse_error(const string &msg, const int line_num, const char *context) {

    parse_error(msg.c_str(), line_num, context);

}


#if 0

// Remove this since it is not used and contains a potential (low level) vulnerability.

// jhrg 3/7/22

// Disabled (this definition sits inside an #if 0 region): the fixed-size
// buffer variant of save_str. When src is ID_MAX characters or longer it
// reports the problem through parse_error(); otherwise it copies src into
// dst with strncpy and forces a NUL into the last slot. Nothing in this
// function checks how large the buffer behind dst really is.
void save_str(char *dst, const char *src, const int line_num)

{

    if (strlen(src) >= ID_MAX)

        parse_error(string("The word `") + string(src)

                    + string("' is too long (it should be no longer than ")

                    + long_to_string(ID_MAX) + string(")."), line_num);


    strncpy(dst, src, ID_MAX);

    dst[ID_MAX - 1] = '\0';     /* in case ... */

}

#endif


/**
 * @brief Copy a C string into a string variable.
 *
 * @param dst Receives a copy of @p src; its previous contents are replaced.
 * @param src NUL-terminated text to copy.
 * The third (unnamed) parameter is accepted but not used.
 */
void save_str(string &dst, const char *src, const int) {
    dst.assign(src);
}


/**
 * @brief Test whether an identifier matches a keyword.
 *
 * The identifier is passed through downcase() and prune_spaces() before it
 * is compared; @p keyword is compared exactly as given.
 *
 * @param id      Identifier to test (taken by value, so the caller's copy
 *                is not modified).
 * @param keyword Keyword to compare against.
 * @return true when the normalized identifier equals @p keyword.
 */
bool is_keyword(string id, const string &keyword) {
    downcase(id);
    const string candidate = prune_spaces(id);

    DBG(cerr << "is_keyword: " << keyword << " = " << candidate << endl);

    return keyword == candidate;
}


/**
 * @brief Check that a string holds an integer that fits in 8 bits.
 *
 * The text is parsed with strtol() using base 0, so the radix is taken from
 * the text itself. Both signed and unsigned 8-bit interpretations are
 * accepted: negative values down to DODS_SCHAR_MIN and positive values up
 * to DODS_UCHAR_MAX pass.
 *
 * @param val NUL-terminated text to check.
 * @return TRUE when the whole string is an acceptable value, else FALSE.
 */
int check_byte(const char *val) {
    char *end;
    const long parsed = strtol(val, &end, 0);

    // Reject text with no digits at all and text with trailing characters.
    const bool nothing_parsed = (parsed == 0 && end == val);
    if (nothing_parsed || *end != '\0')
        return FALSE;

    DBG(cerr << "v: " << parsed << endl);

    // The range test is deliberately liberal: anything that fits in eight
    // bits, signed or unsigned, is allowed through. Clients (for example
    // those whose byte type is signed) must cope with the representation.
    if (parsed < 0)
        return (parsed < DODS_SCHAR_MIN) ? FALSE : TRUE;

    if (parsed > 0 && static_cast<unsigned long>(parsed) > DODS_UCHAR_MAX)
        return FALSE;

    return TRUE;
}


// This version of check_int will pass base 8, 10 and 16 numbers when they

// use the ANSI standard for string representation of those number bases.


/**
 * @brief Check that a string holds a valid 16-bit signed integer.
 *
 * The text is parsed with strtol() using base 0, so octal, decimal and
 * hexadecimal notations are recognized from the text itself.
 *
 * @param val NUL-terminated text to check.
 * @return TRUE when the whole string parses and the value lies between
 *         DODS_SHRT_MIN and DODS_SHRT_MAX (inclusive), else FALSE.
 */
int check_int16(const char *val) {
    char *end;
    const long parsed = strtol(val, &end, 0); // base 0: radix comes from val

    // Trailing characters, or no digits at all, make the text invalid.
    if (*end != '\0' || (end == val && parsed == 0))
        return FALSE;

    // Compare against the limits from dods-limits.h, not those of limits.h.
    const bool in_range = (parsed <= DODS_SHRT_MAX && parsed >= DODS_SHRT_MIN);
    return in_range ? TRUE : FALSE;
}


/**
 * @brief Check that a string holds a valid 16-bit unsigned integer.
 *
 * The text is parsed with strtol() using base 0 and the result is stored in
 * an unsigned long before it is compared with DODS_USHRT_MAX.
 *
 * @param val NUL-terminated text to check.
 * @return TRUE when the whole string parses and the value does not exceed
 *         DODS_USHRT_MAX, else FALSE.
 */
int check_uint16(const char *val) {
    char *end;
    // The signed result is converted to unsigned here, so a negative number
    // becomes a very large value and is caught by the range test below
    // (presumably DODS_USHRT_MAX is the 16-bit maximum; see dods-limits.h).
    const unsigned long parsed = strtol(val, &end, 0);

    const bool nothing_parsed = (parsed == 0 && end == val);
    if (nothing_parsed || *end != '\0')
        return FALSE;

    return (parsed > DODS_USHRT_MAX) ? FALSE : TRUE;
}


/**
 * @brief Check that a string holds a valid 32-bit signed integer.
 *
 * @param val NUL-terminated text to check; the radix is taken from the text.
 * @return TRUE when the whole string parses without overflow and the value
 *         lies between DODS_INT_MIN and DODS_INT_MAX, else FALSE.
 */
int check_int32(const char *val) {
    char *end;
    errno = 0;
    const long parsed = strtol(val, &end, 0); // base 0: radix comes from val

    if ((parsed == 0 && end == val) || *end != '\0')
        return FALSE;

    // strtol clamps its result on overflow, so a clamped value could slip
    // past the comparison below; errno is the only reliable overflow signal.
    if (errno == ERANGE)
        return FALSE;

    // Where 'long' is 64 bits wide the parsed value may still be too large
    // for a 32-bit integer, hence the explicit comparison with the limits.
    if (parsed > DODS_INT_MAX || parsed < DODS_INT_MIN)
        return FALSE;

    return TRUE;
}


/**
 * @brief Check that a string holds a valid 32-bit unsigned integer.
 *
 * Leading whitespace is skipped and a following '-' makes the text invalid
 * (strtoul itself would accept a minus sign). The text is then parsed with
 * strtoul() using base 0.
 *
 * @param val NUL-terminated text to check.
 * @return TRUE when the whole string parses without overflow and the value
 *         does not exceed DODS_UINT_MAX, else FALSE.
 */
int check_uint32(const char *val) {
    // Skip whitespace and look for an initial '-' sign. The character is
    // converted to unsigned char first because passing a negative char
    // value to isspace() is undefined behaviour.
    const char *c = val;
    while (c && isspace(static_cast<unsigned char>(*c))) {
        c++;
    }
    if (c && (*c == '-')) {
        return FALSE;
    }

    char *ptr;
    errno = 0;
    const unsigned long v = strtoul(val, &ptr, 0);

    // No digits at all, or trailing characters after the number.
    if ((v == 0 && val == ptr) || *ptr != '\0') {
        return FALSE;
    }

    // Check overflow first: strtoul clamps to its maximum value, which
    // would make the comparison below meaningless.
    if (errno == ERANGE) {
        return FALSE;
    }

    // 'unsigned long' may be wider than 32 bits, so compare explicitly.
    if (v > DODS_UINT_MAX) {
        return FALSE;
    }

    return TRUE;
}


/**
 * @brief Check a string for a 32-bit signed integer and return its value.
 *
 * @param val NUL-terminated text to check; the radix is taken from the text.
 * @param v   Receives the parsed value. It is written only when the
 *            function returns TRUE.
 * @return TRUE when the whole string parses without overflow and the value
 *         lies between DODS_INT_MIN and DODS_INT_MAX, else FALSE.
 */
int check_int32(const char *val, int &v) {
    char *end;
    errno = 0;
    const long parsed = strtol(val, &end, 0); // base 0: radix comes from val

    const bool nothing_parsed = (parsed == 0 && end == val);
    if (nothing_parsed || *end != '\0')
        return FALSE;

    // strtol clamps on overflow, so errno has to be consulted before the
    // value itself can be trusted.
    if (errno == ERANGE)
        return FALSE;

    // 'long' can be wider than 32 bits; reject values that do not fit.
    if (parsed > DODS_INT_MAX || parsed < DODS_INT_MIN)
        return FALSE;

    v = (int)parsed;
    return TRUE;
}


/**
 * @brief Check a string for a 32-bit unsigned integer and return its value.
 *
 * Leading whitespace is skipped and a following '-' makes the text invalid
 * (strtoul itself would accept a minus sign). The text is then parsed with
 * strtoul() using base 0.
 *
 * @param val NUL-terminated text to check.
 * @param v   Receives the parsed value. It is written only when the
 *            function returns TRUE.
 * @return TRUE when the whole string parses without overflow and the value
 *         does not exceed DODS_UINT_MAX, else FALSE.
 */
int check_uint32(const char *val, unsigned int &v) {
    // Skip whitespace and look for an initial '-' sign. The character is
    // converted to unsigned char first because passing a negative char
    // value to isspace() is undefined behaviour.
    const char *c = val;
    while (c && isspace(static_cast<unsigned char>(*c))) {
        c++;
    }
    if (c && (*c == '-')) {
        return FALSE;
    }

    char *ptr;
    errno = 0;
    const unsigned long tmp = strtoul(val, &ptr, 0);

    // No digits at all, or trailing characters after the number.
    if ((tmp == 0 && val == ptr) || *ptr != '\0') {
        return FALSE;
    }

    // Check overflow first: strtoul clamps to its maximum value, which
    // would make the comparison below meaningless.
    if (errno == ERANGE) {
        return FALSE;
    }

    // 'unsigned long' may be wider than 32 bits, so compare explicitly.
    if (tmp > DODS_UINT_MAX) {
        return FALSE;
    }

    v = static_cast<unsigned int>(tmp);
    return TRUE;
}


/**
 * @brief Check that a string holds a valid 64-bit signed integer.
 *
 * @param val NUL-terminated text to check; the radix is taken from the text.
 * @return TRUE when the whole string parses and strtoll() did not report
 *         an out-of-range value, else FALSE.
 */
int check_int64(const char *val) {
    char *end;
    errno = 0;
    const long long parsed = strtoll(val, &end, 0); // base 0: radix comes from val

    const bool nothing_parsed = (parsed == 0 && end == val);
    if (nothing_parsed || *end != '\0')
        return FALSE;

    // strtoll clamps on overflow, so errno is the overflow signal. There is
    // no extra comparison with DODS_LLONG_MIN/DODS_LLONG_MAX: it was removed
    // earlier because static analysis showed it could never reject a value.
    return (errno == ERANGE) ? FALSE : TRUE;
}


int check_uint64(const char *val) {

    // Eat whitespace and check for an initial '-' sign...

    // strtoul allows an initial minus. mjohnson

    const char *c = val;

    while (c && isspace(*c)) {

        c++;

    }

    if (c && (*c == '-')) {

        return FALSE;

    }


    char *ptr;

    errno = 0;

    unsigned long long v = strtoull(val, &ptr, 0);


    if ((v == 0 && val == ptr) || *ptr != '\0') {

        return FALSE;

    }


    if (errno == ERANGE) {

        return FALSE;

    } else if (v > DODS_ULLONG_MAX) { // 2^61

        return FALSE;

    } else {

        return v;

    }

}


// Check first for system errors (like numbers so small they convert

// erroneously to zero). Then make sure that the value is within

// limits.


/**
 * @brief Check that a string holds a valid 32-bit floating point value.
 *
 * The text is converted with strtod() (w32strtod() when WIN32 is defined)
 * and the magnitude of the result is compared with DODS_FLT_MAX and
 * DODS_FLT_MIN. An exact zero is accepted.
 *
 * @param val NUL-terminated text to check.
 * @return TRUE when the whole string converts without a range error and
 *         the magnitude is within the limits, else FALSE.
 */
int check_float32(const char *val) {
    char *end;
    errno = 0; // strtod only sets errno on failure, so clear any old value

#ifdef WIN32
    const double parsed = w32strtod(val, &end);
#else
    const double parsed = strtod(val, &end);
#endif

    DBG(cerr << "v: " << parsed << ", ptr: " << end << ", errno: " << errno << ", val==ptr: " << (val == end) << endl);

    // Range error reported by the conversion itself.
    if (errno == ERANGE)
        return FALSE;
    // Nothing was converted.
    if (parsed == 0.0 && val == end)
        return FALSE;
    // Characters left over after the number.
    if (*end != '\0')
        return FALSE;

    DBG(cerr << "fabs(" << val << ") = " << fabs(parsed) << endl);

    const double magnitude = fabs(parsed);
    if (magnitude > DODS_FLT_MAX)
        return FALSE;
    if (magnitude != 0.0 && magnitude < DODS_FLT_MIN)
        return FALSE;

    return TRUE;
}


/**
 * @brief Check that a string holds a valid 64-bit floating point value.
 *
 * The text is converted with strtod() (w32strtod() when WIN32 is defined)
 * and the magnitude of the result is compared with DODS_DBL_MAX and
 * DODS_DBL_MIN. An exact zero is accepted.
 *
 * @param val NUL-terminated text to check.
 * @return TRUE when the whole string converts without a range error and
 *         the magnitude is within the limits, else FALSE.
 */
int check_float64(const char *val) {
    DBG(cerr << "val: " << val << endl);

    char *end;
    errno = 0; // strtod only sets errno on failure, so clear any old value

#ifdef WIN32
    const double parsed = w32strtod(val, &end);
#else
    const double parsed = strtod(val, &end);
#endif

    DBG(cerr << "v: " << parsed << ", ptr: " << end << ", errno: " << errno << ", val==ptr: " << (val == end) << endl);

    // Range error reported by the conversion itself.
    if (errno == ERANGE)
        return FALSE;
    // Nothing was converted.
    if (parsed == 0.0 && val == end)
        return FALSE;
    // Characters left over after the number.
    if (*end != '\0')
        return FALSE;

    DBG(cerr << "fabs(" << val << ") = " << fabs(parsed) << endl);

    const double magnitude = fabs(parsed);
    if (magnitude > DODS_DBL_MAX)
        return FALSE;
    if (magnitude != 0.0 && magnitude < DODS_DBL_MIN)
        return FALSE;

    return TRUE;
}


/**
 * @brief Check a string for a 64-bit floating point value and return it.
 *
 * The text is converted with strtod() (w32strtod() when WIN32 is defined)
 * and the magnitude of the result is compared with DODS_DBL_MAX and
 * DODS_DBL_MIN. An exact zero is accepted.
 *
 * @param val NUL-terminated text to check.
 * @param v   Receives the result of the conversion. It is assigned before
 *            any validation, so it is modified even when FALSE is returned.
 * @return TRUE when the whole string converts without a range error and
 *         the magnitude is within the limits, else FALSE.
 */
int check_float64(const char *val, double &v) {
    DBG(cerr << "val: " << val << endl);

    char *end;
    errno = 0; // strtod only sets errno on failure, so clear any old value

#ifdef WIN32
    v = w32strtod(val, &end);
#else
    v = strtod(val, &end);
#endif

    DBG(cerr << "v: " << v << ", ptr: " << end << ", errno: " << errno << ", val==ptr: " << (val == end) << endl);

    // Range error reported by the conversion itself.
    if (errno == ERANGE)
        return FALSE;
    // Nothing was converted.
    if (v == 0.0 && val == end)
        return FALSE;
    // Characters left over after the number.
    if (*end != '\0')
        return FALSE;

    DBG(cerr << "fabs(" << val << ") = " << fabs(v) << endl);

    const double magnitude = fabs(v);
    if (magnitude > DODS_DBL_MAX)
        return FALSE;
    if (magnitude != 0.0 && magnitude < DODS_DBL_MIN)
        return FALSE;

    return TRUE;
}


/**
 * @brief Convert a string to a 64-bit signed integer.
 *
 * @param val NUL-terminated text to convert; the radix is taken from the
 *            text.
 * @return The parsed value.
 * @throws Error when the text contains no number or has trailing
 *         characters, or when strtoll() reports an out-of-range value.
 */
long long get_int64(const char *val) {
    char *end;
    errno = 0;
    const long long parsed = strtoll(val, &end, 0); // base 0: radix comes from val

    const bool nothing_parsed = (parsed == 0 && end == val);
    if (nothing_parsed || *end != '\0')
        throw Error("Expected a 64-bit integer, but found other characters.");

    // strtoll clamps on overflow, so errno is the overflow signal. A further
    // comparison with DODS_LLONG_MIN/DODS_LLONG_MAX was removed earlier as
    // useless for a value that is already a long long.
    if (errno == ERANGE)
        throw Error("The 64-bit integer value is out of range.");

    return parsed;
}


/**
 * @brief Convert a string to a 64-bit unsigned integer.
 *
 * Leading whitespace is skipped and a following '-' is rejected (strtoull
 * itself would accept a minus sign). The text is then parsed with
 * strtoull() using base 0.
 *
 * @param val NUL-terminated text to convert.
 * @return The parsed value.
 * @throws Error when the number is negative, when the text contains no
 *         number or has trailing characters, or when strtoull() reports an
 *         out-of-range value.
 */
unsigned long long get_uint64(const char *val) {
    // Skip whitespace and look for an initial '-' sign. The character is
    // converted to unsigned char first because passing a negative char
    // value to isspace() is undefined behaviour.
    const char *c = val;
    while (c && isspace(static_cast<unsigned char>(*c))) {
        c++;
    }
    if (c && (*c == '-')) {
        throw Error("Expected a valid array index.");
    }

    char *ptr;
    errno = 0;
    const unsigned long long v = strtoull(val, &ptr, 0);

    // No digits at all, or trailing characters after the number.
    if ((v == 0 && val == ptr) || *ptr != '\0') {
        throw Error("Expected an unsigned 64-bit integer, but found other characters.");
    }

    // strtoull clamps on overflow; errno is the only overflow signal. An
    // additional upper-bound comparison was disabled earlier after static
    // analysis flagged it.
    if (errno == ERANGE) {
        throw Error("The 64-bit integer value is out of range.");
    }

    return v;
}


/**
 * @brief Convert a string to a 32-bit signed integer.
 *
 * @param val NUL-terminated text to convert; the radix is taken from the
 *            text.
 * @return The parsed value.
 * @throws Error when the text contains no number or has trailing
 *         characters, or when the value does not fit between DODS_INT_MIN
 *         and DODS_INT_MAX.
 */
int get_int32(const char *val) {
    char *ptr;
    errno = 0;
    // Keep the full 'long' result. Narrowing it to int before the range
    // test would silently truncate values where 'long' is wider than int
    // and make the test below impossible to fail.
    const long v = strtol(val, &ptr, 0); // base 0: radix comes from val

    // No digits at all, or trailing characters after the number.
    if ((v == 0 && val == ptr) || *ptr != '\0') {
        throw Error("Expected a 32-bit integer, but found other characters.");
    }

    // strtol clamps on overflow, so errno must be checked as well as the
    // 32-bit limits. Both conditions are errors: returning a value here
    // would be indistinguishable from a successfully parsed number.
    if (errno == ERANGE || v > DODS_INT_MAX || v < DODS_INT_MIN) {
        throw Error("The 32-bit integer value is out of range.");
    }

    return static_cast<int>(v);
}


/**
 * @brief Convert a string to a 32-bit unsigned integer.
 *
 * Leading whitespace is skipped and a following '-' is rejected (strtoul
 * itself would accept a minus sign). The text is then parsed with
 * strtoul() using base 0.
 *
 * @param val NUL-terminated text to convert.
 * @return The parsed value.
 * @throws Error when the number is negative, when the text contains no
 *         number or has trailing characters, or when the value exceeds
 *         DODS_UINT_MAX.
 */
unsigned int get_uint32(const char *val) {
    // Skip whitespace and look for an initial '-' sign. The character is
    // converted to unsigned char first because passing a negative char
    // value to isspace() is undefined behaviour.
    const char *c = val;
    while (c && isspace(static_cast<unsigned char>(*c))) {
        c++;
    }
    if (c && (*c == '-')) {
        throw Error("Expected an unsigned 32-bit integer, but found other characters.");
    }

    char *ptr;
    errno = 0;
    // Keep the full 'unsigned long' result. Narrowing it to unsigned int
    // before the range test would silently truncate values where
    // 'unsigned long' is wider and make the test below impossible to fail.
    const unsigned long v = strtoul(val, &ptr, 0);

    // No digits at all, or trailing characters after the number.
    if ((v == 0 && val == ptr) || *ptr != '\0') {
        throw Error("Expected an unsigned 32-bit integer, but found other characters.");
    }

    // strtoul clamps on overflow, so errno must be checked as well as the
    // 32-bit limit. Both conditions are errors: returning a value here
    // would be indistinguishable from a successfully parsed number.
    if (errno == ERANGE || v > DODS_UINT_MAX) {
        throw Error("The 32-bit integer value is out of range.");
    }

    return static_cast<unsigned int>(v);
}


/**
 * @brief Convert a string to a 64-bit floating point value.
 *
 * The text is converted with strtod() (w32strtod() when WIN32 is defined)
 * and the magnitude of the result is compared with DODS_DBL_MAX and
 * DODS_DBL_MIN. An exact zero is accepted.
 *
 * @param val NUL-terminated text to convert.
 * @return The converted value.
 * @throws Error when the conversion reports a range error, converts
 *         nothing, leaves trailing characters, or yields a magnitude
 *         outside the limits. The same message is used in every case.
 */
double get_float64(const char *val) {
    DBG(cerr << "val: " << val << endl);

    char *end;
    errno = 0; // strtod only sets errno on failure, so clear any old value

#ifdef WIN32
    const double parsed = w32strtod(val, &end);
#else
    const double parsed = strtod(val, &end);
#endif

    const bool nothing_parsed = (parsed == 0.0 && val == end);
    if (errno == ERANGE || nothing_parsed || *end != '\0') {
        throw Error("The 64-bit floating point value is out of range.");
    }

    DBG(cerr << "fabs(" << val << ") = " << fabs(parsed) << endl);

    const double magnitude = fabs(parsed);
    const bool too_large = (magnitude > DODS_DBL_MAX);
    const bool too_small = (magnitude != 0.0 && magnitude < DODS_DBL_MIN);
    if (too_large || too_small) {
        throw Error("The 64-bit floating point value is out of range.");
    }

    return parsed;
}


/*

  Maybe someday we will really check the Urls to see if they are valid...

*/


/**
 * @brief Placeholder URL check.
 *
 * No validation is performed; the (unnamed) argument is ignored.
 *
 * @return Always TRUE.
 */
int check_url(const char *) {
    return TRUE;
}


} // namespace libdap

Error.h

unknown_error
#define unknown_error
Unknown error (the default code) (HTTP 400)
Definition Error.h:62

malformed_expr
#define malformed_expr
(400)
Definition Error.h:66

libdap::Error
A class for error processing.
Definition Error.h:92

config.h

debug.h

DBG
#define DBG(x)
Definition debug.h:58

dods-limits.h

DODS_DBL_MAX
#define DODS_DBL_MAX
Definition dods-limits.h:87

DODS_DBL_MIN
#define DODS_DBL_MIN
Definition dods-limits.h:89

DODS_SHRT_MIN
#define DODS_SHRT_MIN
Definition dods-limits.h:68

DODS_UCHAR_MAX
#define DODS_UCHAR_MAX
Definition dods-limits.h:65

DODS_SCHAR_MIN
#define DODS_SCHAR_MIN
Definition dods-limits.h:63

DODS_SHRT_MAX
#define DODS_SHRT_MAX
Definition dods-limits.h:69

DODS_UINT_MAX
#define DODS_UINT_MAX
Definition dods-limits.h:74

DODS_MAX_ARRAY_INDEX
#define DODS_MAX_ARRAY_INDEX
Definition dods-limits.h:84

DODS_LLONG_MAX
#define DODS_LLONG_MAX
Definition dods-limits.h:81

DODS_INT_MAX
#define DODS_INT_MAX
Definition dods-limits.h:73

DODS_FLT_MIN
#define DODS_FLT_MIN
Definition dods-limits.h:93

DODS_INT_MIN
#define DODS_INT_MIN
Definition dods-limits.h:72

DODS_USHRT_MAX
#define DODS_USHRT_MAX
Definition dods-limits.h:70

DODS_FLT_MAX
#define DODS_FLT_MAX
Definition dods-limits.h:92

DODS_LLONG_MIN
#define DODS_LLONG_MIN
Definition dods-limits.h:80

DODS_ULLONG_MAX
#define DODS_ULLONG_MAX
Definition dods-limits.h:82

libdap::check_float64
int check_float64(const char *val)
Definition parser-util.cc:443

libdap::check_uint64
int check_uint64(const char *val)
Definition parser-util.cc:380

libdap::check_url
int check_url(const char *)
Is the value a valid URL?
Definition parser-util.cc:653

libdap::check_uint16
int check_uint16(const char *val)
Definition parser-util.cc:217

libdap::check_int64
int check_int64(const char *val)
Definition parser-util.cc:350

libdap::check_byte
int check_byte(const char *val)
Is the value a valid byte?
Definition parser-util.cc:178

libdap::check_uint32
int check_uint32(const char *val)
Definition parser-util.cc:257

libdap::check_int16
int check_int16(const char *val)
Definition parser-util.cc:202

libdap::check_float32
int check_float32(const char *val)
Definition parser-util.cc:412

libdap::check_int32
int check_int32(const char *val)
Definition parser-util.cc:232

libdap::get_float64
double get_float64(const char *val)
Definition parser-util.cc:625

libdap::get_int64
long long get_int64(const char *val)
Definition parser-util.cc:501

libdap::get_uint32
unsigned int get_uint32(const char *val)
Definition parser-util.cc:595

libdap::get_int32
int get_int32(const char *val)
Definition parser-util.cc:568

libdap::get_uint64
unsigned long long get_uint64(const char *val)
Definition parser-util.cc:535

TRUE
#define TRUE
Definition gse_parser.h:32

FALSE
#define FALSE
Definition gse_parser.h:33

ID_MAX
#define ID_MAX
Definition gse_parser.h:29

libdap
top level DAP object to house generic methods
Definition AISConnect.cc:30

libdap::long_to_string
string long_to_string(long val, int base)
Definition util.cc:946

libdap::prune_spaces
string prune_spaces(const string &name)
Definition util.cc:451

libdap::save_str
void save_str(string &dst, const char *src, const int)
Save a string to a temporary variable during the parse.
Definition parser-util.cc:159

libdap::append_long_to_string
void append_long_to_string(long val, int base, string &str_val)
Definition util.cc:919

libdap::downcase
void downcase(string &s)
Definition util.cc:544

libdap::parse_error
void parse_error(parser_arg *arg, const char *msg, const int line_num, const char *context)
Definition parser-util.cc:89

libdap::is_keyword
bool is_keyword(string id, const string &keyword)
Definition parser-util.cc:161

parser.h

libdap::parser_arg
Pass parameters by reference to a parser.
Definition parser.h:67

libdap::parser_arg::set_error
void set_error(Error *obj)
Definition parser.h:84

libdap::parser_arg::set_status
void set_status(int val=0)
Definition parser.h:86

util.h