Boost.Spirit grammar issue

Question

I am attempting to parse a terminfo definitions text file. I am new to Boost.Spirit. I have started with a simple grammar that only parses comment lines, empty lines and terminal definitions. As the code comment in the grammar shows, uncommenting the [_val = _1] for definition breaks compilation. Why? Can I fix it?

If I ignore the actual terminfo file, I expect the code below to parse this kind of text:

# comment line

first definition line
  second 
  third line

# another comment line

Code:

#include 
#include 
#include 
#include 
#include 
#include 
#include 
#include 
#include 
#include 

namespace termcxx
{

namespace parser
{

namespace qi = boost::spirit::qi;
namespace ascii = boost::spirit::ascii;
namespace px = boost::phoenix;

//using qi::double_;
using ascii::space;
//using px::ref;
using px::construct;

//using qi::eps;
//using qi::lit;
using qi::_val;
using qi::_1;
using ascii::char_;
using qi::eol;
using qi::eoi;


// Attribute type synthesized by the grammar's start rule.
// It carries no parsed data yet: the converting constructors accept the
// character sequences produced by the line rules and discard them.
struct context
{
    // Placeholder member; zero-initialised so that every constructor leaves
    // the object in a defined state.
    int dummy = 0;

    context () = default;
    context (context const &) = default;
    // Built from the characters of one matched line (currently ignored).
    context (std::vector<char> a)
    { }
    // Built from the characters of two matched lines (currently ignored).
    context (std::vector<char> a, std::vector<char> b)
    { }
};

} }


// Registers termcxx::parser::context with Boost.Fusion, listing its single
// member `dummy` (int). The macro is invoked outside the termcxx namespaces.
BOOST_FUSION_ADAPT_STRUCT(
    termcxx::parser::context,
    (int, dummy))


namespace termcxx
{

namespace parser
{

template 
struct parser
    : qi::grammar
{
    qi::rule > comment_line
    = (*space >> '#' >> *(char_ - eol) >> (eol | eoi))[_val = _1]
        ;

    qi::rule > empty_line
    = (*space >> (eol | eoi))[_val = _1]
        ;

    qi::rule > def_first_line
    = (+(char_ - eol) >> (eol | eoi))[_val = _1]
        ;

    qi::rule > def_subsequent_line
    = (+space >> +(char_ - eol) >> (eol | eoi))[_val = _1]
        ;

    qi::rule > definition
    = (def_first_line >> *def_subsequent_line)//[_val = _1] // Uncommenting the [_val = _1] breaks compilation. Why?
        ;

    qi::rule start
    = (*(comment_line
            | empty_line
            | definition))[_val = construct ()]
        ;

    parser()
        : parser::base_type(start)
    { }
};

template struct parser;

} // namespace parser

} // namespace termcxx

sehe · Accepted Answer

Why do you insist on specifying [_val=_1]? It's redundant, because the default attribute propagation already does this. In fact it hurts; see below.

Next, the attribute type of (def_first_line >> *def_subsequent_line) is (apparently) not compatible with std::vector<char>. Perhaps you can:

- just use the default attribute propagation (which has enough smarts to just keep appending)
- use raw[] to get the complete matched input
- define BOOST_SPIRIT_ACTIONS_ALLOW_ATTR_COMPAT (I'm not sure this is well supported)

Also,

- you can replace std::vector<char> with std::string when relying on automatic attribute propagation
- you can detect the actual exposed type of a parser expression (see: "Detecting the parameter types in a Spirit semantic action")

Update

A few more issues:

You had misspelled the attribute types for most rules (missing the trailing ()); they should be declared as:

// Rule attributes are given as function signatures: note the trailing ().
qi::rule<Iterator, std::vector<char>()> comment_line;
qi::rule<Iterator, std::vector<char>()> empty_line;
qi::rule<Iterator, std::vector<char>()> def_first_line;
qi::rule<Iterator, std::vector<char>()> def_subsequent_line;
qi::rule<Iterator, std::vector<char>()> definition;

The empty_line rule also matched at eoi, leading to an infinite loop at the end of input.

The use of char_ also accepts spaces (use graph for the first character instead):

    def_first_line      = graph >> +(char_ - eol)         >> (eol|eoi);

The use of qi::space also eats line ends! Use qi::blank instead.

Favour readability:

    // One rule per kind of line; blank matches spaces/tabs but not line ends.
    empty_line          = *blank >> eol;
    comment_line        = *blank >> '#' >> *(char_ - eol) >> (eol|eoi);
    def_first_line      = graph >> +(char_ - eol)         >> (eol|eoi);
    def_subsequent_line = +blank >> +(char_ - eol)        >> (eol|eoi);

    // A definition is a first line plus any number of indented continuation lines.
    definition          = (def_first_line >> *def_subsequent_line);

    // The start rule discards the parsed lines and yields a default-constructed context.
    start               = (  
                            *(comment_line | empty_line | definition)
                          ) [ _val = px::construct<context>() ]
                          ;

This simple habit will save you hours and hours of work and your sanity when working with Spirit.

You could simplify the includes somewhat

Here's a fixed up version Live On Coliru with output:


  # comment line

firs
  
    # comment line

firs
    
first definition li
    [[ , c, o, m, m, e, n, t,  , l, i, n, e]]
  
  
    
first definition li
    
  
  
    
first definition li
    first definition lin
    [[]]
  
  
    first definition lin
    
  
  
    first definition lin
    
  
  
    first definition lin
    
      first definition lin
        second 
  third li
      [[f, i, r, s, t,  , d, e, f, i, n, i, t, i, o, n,  , l, i, n, e]]
    
    
        second 
  third li
        third line

# anot
      [[f, i, r, s, t,  , d, e, f, i, n, i, t, i, o, n,  , l, i, n, e,  ,  , s, e, c, o, n, d,  ]]
    
    
        third line

# anot
      
# another comment l
      [[f, i, r, s, t,  , d, e, f, i, n, i, t, i, o, n,  , l, i, n, e,  ,  , s, e, c, o, n, d,  ,  ,  , t, h, i, r, d,  , l, i, n, e]]
    
    
      
# another comment l
      
    
    
# another comment l
    [[f, i, r, s, t,  , d, e, f, i, n, i, t, i, o, n,  , l, i, n, e,  ,  , s, e, c, o, n, d,  ,  ,  , t, h, i, r, d,  , l, i, n, e]]
  
  
    
# another comment l
    
  
  
    
# another comment l
    # another comment li
    [[]]
  
  
    # another comment li
    
    [[ , a, n, o, t, h, e, r,  , c, o, m, m, e, n, t,  , l, i, n, e, !]]
  
  
    
    
  
  
    
    
  
  
    
    
      
      
    
    
  
  
  []

Success

Full code for reference:

#define BOOST_SPIRIT_DEBUG
#include <boost/fusion/include/adapt_struct.hpp>
#include <boost/spirit/include/qi.hpp>
#include <boost/spirit/include/phoenix.hpp>

#include <iostream>
#include <string>
#include <vector>

namespace qi = boost::spirit::qi;

namespace termcxx { namespace parser {

    namespace ascii = boost::spirit::ascii;
    namespace px    = boost::phoenix;

    //using qi::double_;
    using ascii::blank;
    //using px::ref;
    using px::construct;

    //using qi::eps;
    //using qi::lit;
    using qi::_val;
    using qi::_1;
    using ascii::char_;
    using ascii::graph;
    using qi::eol;
    using qi::eoi;

    // Attribute type synthesized by the grammar's start rule.
    // It carries no parsed data yet: the converting constructors accept the
    // character sequences produced by the line rules and discard them.
    struct context
    {
        // Placeholder member; zero-initialised so that every constructor
        // leaves the object in a defined state.
        int dummy = 0;

        context () = default;
        context (context const &) = default;
        // Built from the characters of one matched line (currently ignored).
        context (std::vector<char> a) { }
        // Built from the characters of two matched lines (currently ignored).
        context (std::vector<char> a, std::vector<char> b) { }
    };

} }

// Registers termcxx::parser::context with Boost.Fusion, listing its single member `dummy` (int).
BOOST_FUSION_ADAPT_STRUCT(termcxx::parser::context, (int, dummy))

namespace termcxx { namespace parser {

    // Line-oriented grammar: input is a sequence of comment lines, empty
    // lines and definitions (a first line followed by indented continuation
    // lines). The grammar synthesizes a `context`; the line rules expose the
    // characters they match as std::vector<char>.
    template <typename Iterator>
    struct parser : qi::grammar<Iterator, context()>
    {
        parser() : parser::base_type(start)
        { 
            // blank matches spaces/tabs only, so line ends stay visible to eol.
            // empty_line requires a real eol (not eoi).
            empty_line          = *blank >> eol;
            comment_line        = *blank >> '#' >> *(char_ - eol) >> (eol|eoi);
            // A definition's first line must begin with a visible (graph) character.
            def_first_line      = graph >> +(char_ - eol)         >> (eol|eoi);
            def_subsequent_line = +blank >> +(char_ - eol)        >> (eol|eoi);

            definition          = (def_first_line >> *def_subsequent_line);

            // The parsed lines are discarded; the result is a default-constructed context.
            start               = (  
                                    *(comment_line | empty_line | definition)
                                  ) [ _val = px::construct<context>() ]
                                  ;

            // Enables per-rule tracing when BOOST_SPIRIT_DEBUG is defined.
            BOOST_SPIRIT_DEBUG_NODES((start)(def_first_line)(def_subsequent_line)(definition)(empty_line)(comment_line))
        }

      private:
        // Attribute types are given as function signatures (note the trailing ()).
        qi::rule<Iterator, context()> start;
        qi::rule<Iterator, std::vector<char>()> comment_line;
        qi::rule<Iterator, std::vector<char>()> empty_line;
        qi::rule<Iterator, std::vector<char>()> def_first_line;
        qi::rule<Iterator, std::vector<char>()> def_subsequent_line;
        qi::rule<Iterator, std::vector<char>()> definition;
    };

} }

int main()
{
    using It = boost::spirit::istream_iterator;
    termcxx::parser::parser g;

    It f(std::cin >> std::noskipws), l;
    termcxx::parser::context data;
    if (qi::parse(f,l,g,data))
        std::cout << "Success
";
    else
        std::cout << "Failure
";

    if (f != l)
        std::cout << "Remaining input: '" << std::string(f,l) << "'
";
}

Boost.Spirit grammar issue

Answers (2)

Related Questions