3

我目前正在尝试使用完成一些工作,boost::spirit::qi::phrase_parse但我无法自己解决这个问题。

值得一提的是:我对 boost 和 boost::spirit 完全陌生。

我收到了表单的输入"{A [B C] -> F [D E], C ->E,B->Z}"

我想将这种类型的输入解析为std::map<std::string, std::string>. 键应该保持std::string在之前的每一个和每一个之后"->"的值,直到发生。std::string"->"','

此外'['']'不应存储 and 。

所以std::map解析成功后的内容应该是这样的:

     {
       ("A", "F"),
       ("A", "D E"),
       ("B C", "F"),
       ("B C", "D E"),
       ("C", "E"),
       ("B", "Z")
     }

我的第一种方法是将所有键/值存储在std::vector<std::string>.

    #include <boost/spirit/include/qi.hpp>

    #include <iostream>
    #include <string>
    #include <vector>

    int main()
    {
        using boost::spirit::qi::phrase_parse;
        using boost::spirit::qi::char_;
        using boost::spirit::qi::lexeme;

        std::string input = "{A [B C] -> F [D E], C    ->E,B->Z}";
        std::string::const_iterator beg = input.begin(), end = input.end();

        std::vector<std::string> sdvec;

        bool r = phrase_parse(  beg, 
                                end,
                                '{' >> (+(+char_("a-zA-Z0-9") | lexeme[('[' >> +char_("a-zA-Z0-9 ") >> ']')]) >> '-' >> '>' >> +(+char_("a-zA-Z0-9") | lexeme[('[' >> +char_("a-zA-Z0-9 ") >> ']')])) % ',' >> '}',
                                boost::spirit::ascii::space,
                                sdvec
                           );

        if(beg != end) {
            std::cout << "Parsing failed!" << std::endl;
        } else {
            std::cout << "Parsing succeeded!" << std::endl;    
        }

        for(int i=0; i<sdvec.size(); i++) {
            std::cout << i << ": " << sdvec[i] << std::endl;
        }

        return 0;
    }

执行此操作,我将每个都std::string作为以下条目找到std::vector

    Parsing 2 succeeded!
    0: A
    1: B C
    2: F
    3: D E
    4: C
    5: E
    6: B
    7: Z

但我不知道如何将这些值解析为std::map<std::string, std::string>使用boost::spirit::qi::phrase_parse,因为简单地替换会引发一些编译错误。

编辑:

实际上我发现了一些我需要的东西:http: //boost-spirit.com/home/articles/qi-example/parsing-a-list-of-key-value-pairs-using-spirit-qi/

我根据自己的问题采用了这篇文章的代码:

    #include <boost/spirit/include/qi.hpp>
    #include <boost/fusion/include/std_pair.hpp>

    #include <iostream>
    #include <string>
    #include <vector>
    #include <map>

    namespace qi = boost::spirit::qi;

    template <typename Iterator>
    struct keys_and_values
      : qi::grammar<Iterator, std::map<std::string, std::string>()>
    {
        keys_and_values()
          : keys_and_values::base_type(query)
        {
            query =  '{' >> *qi::lit(' ') >> pair >> *(qi::lit(',') >> *qi::lit(' ') >> pair) >> *qi::lit(' ') >> '}';
            pair  =  key >> -(*qi::lit(' ') >> "->" >> *qi::lit(' ') >> value);
            key   =  +qi::char_("a-zA-Z0-9") | qi::lexeme[('[' >> +qi::char_("a-zA-Z0-9 ") >> ']')];
            value = +qi::char_("a-zA-Z0-9") | qi::lexeme[('[' >> +qi::char_("a-zA-Z0-9 ") >> ']')];
        }
        qi::rule<Iterator, std::map<std::string, std::string>()> query;
        qi::rule<Iterator, std::pair<std::string, std::string>()> pair;
        qi::rule<Iterator, std::string()> key, value;
    };

    int main()
    {
        std::string input = "{AB -> CD, E -> F, G -> HI, [J K L] -> [M N O]                   }";

        std::string::iterator begin = input.begin();
        std::string::iterator end = input.end();

        keys_and_values<std::string::iterator> p;    // create instance of parser
        std::map<std::string, std::string> m;        // map to receive results
        bool result = qi::phrase_parse(begin, end, p, boost::spirit::ascii::space, m);   // returns true if successful

        if(begin != end) {
            std::cout << "Parsing failed!" << std::endl;
        } else {
            std::cout << "Parsing succeeded!" << std::endl;    
        }

        std::cout << m["AB"] << "\t" << m["E"] << "\t" << m["G"] << "\t" << m["J K L"] << std::endl;

        return 0;
    }

这样做的结果或多或少是我需要的:

Parsing succeeded!
CD  F   HI  M N O

我要解决的最后一个问题是类似A [B C] -> F [D E].

有什么方法可以将它们作为四个单独的键值对("A", "F"), ("A", "D E"), ("B C", "F"), ("B C", "D E")放入我的std::map<std::string, std::string> m

或者也许更容易将其解析为std::map<std::vector<std::string>, std::vector<std::string> >每个都std::vector<std::string>包含所有键/值的位置?

例如:

in: "{A [B C] -> F [D E], C ->E,B->Z}"
out: { ({"A", "B C"}, {"F", "D E"}), ({"C"}, {"E"}), ({"B"}, {"Z"}) }

谢谢你的帮助!

4

2 回答 2

4

我认为你非常接近你的目标,所以我将跳过组合部分:-) 解析器将做它应该做的事情......检查语法并标记数据,然后它传递键、值和输出映射( multimap ) 参数到 phoenix 函数inserter中,您可以在其中插入whatever您需要的地图 ( multimap )

#if __cplusplus >= 201103L
#define BOOST_RESULT_OF_USE_DECLTYPE
#endif
#define BOOST_SPIRIT_USE_PHOENIX_V3
#include <boost/spirit/include/qi.hpp>
#include <boost/spirit/include/phoenix.hpp>
#include <iostream>
#include <algorithm>
#include <iterator>
#include <iomanip>
#include <vector>
#include <map>

namespace qi = boost::spirit::qi;
namespace ascii=boost::spirit::ascii;

typedef std::map< std::string,std::string > TMap;
//typedef std::multimap< std::string,std::string > TMap;

struct SMapInsert
{
    template <typename Arg1,typename Arg2,typename Arg3>
    struct result
    {
        typedef void type;
    };

    template <typename Arg1,typename Arg2,typename Arg3>
    void operator()( Arg1&out, Arg2&keys, Arg3&vals ) const
    {
        std::cout << "Keys:" << std::endl;
        for( const auto &key : keys )
            std::cout << std::left << "`" << key << "`" << std::endl;
        std::cout << "Vals:" << std::endl;
        for( const auto &val : vals )
            std::cout << std::left << "`" << val << "`" << std::endl;
        // your map here...
        // out.insert
    }
};

boost::phoenix::function< SMapInsert > inserter;

int main()
{
    std::string input = "{A [B C] -> F [D E], C ->E,B->Z}";
    TMap data;

    std::string::const_iterator iter = input.begin();
    std::string::const_iterator last = input.end();

    qi::rule< std::string::const_iterator,std::string() > token=+qi::alnum;
    qi::rule< std::string::const_iterator,ascii::space_type,std::vector< std::string >() > 
        keyOrvalue = +( token  | ( '[' >> qi::lexeme[ +qi::char_("a-zA-Z0-9 ") ] >> ']' ) );
    qi::rule< std::string::const_iterator,ascii::space_type, TMap() > 
        root = '{' >> ( ( keyOrvalue >> "->" >> keyOrvalue )[ inserter( qi::_val, qi::_1, qi::_2 ) ] ) % ',' >> '}';
    std::cout << "input: `" << input << "`" << std::endl;
    if( qi::phrase_parse( iter, last, root, ascii::space, data ) && iter==last )
    {
        for( const auto &keyValue : data )
            std::cout << std::left << std::setw(10) << keyValue.first << std::setw(10) << keyValue.second << std::endl;
    } 
    else
        std::cout << "parsing failed:" << std::string( iter,last ) << std::endl;        

    return 0;
}
于 2013-09-03T07:37:44.037 回答
3

编辑:这是一种替代方法,但我认为它比 G. Civardi 的解决方案要清晰得多。

正如您所观察到的,解析为 amap<vector<string>,vector<string>>将是最简单的方法,您可以稍后对其进行操作以获得您真正想要的地图。下面的解决方案使用中间结构(基本上等同于map<vector,vector>),然后使用自定义点transform_attribute来填充多重映射(因为有重复的键)。
PS:请原谅使用基于范围的for循环,如果你不能使用c ++ 11,请更改它们。

在大肠杆菌上运行

#define BOOST_SPIRIT_DEBUG

#include <boost/spirit/include/qi.hpp>
#include <boost/fusion/include/adapt_struct.hpp>

#include <iostream>
#include <string>
#include <vector>
#include <map>

namespace qi=boost::spirit::qi;
namespace ascii=boost::spirit::ascii;

struct key_value
{
    std::vector<std::string> keys;
    std::vector<std::string> values;
};

struct intermediate_struct
{
    std::vector<key_value> data;
};

BOOST_FUSION_ADAPT_STRUCT(
    key_value,
    (std::vector<std::string>, keys)
    (std::vector<std::string>, values)
)

BOOST_FUSION_ADAPT_STRUCT(
    intermediate_struct,
    (std::vector<key_value>, data)
)

namespace boost{ namespace spirit{ namespace traits
{

    template <>
    struct transform_attribute<std::multimap<std::string,std::string>,intermediate_struct,qi::domain>
    {
        typedef intermediate_struct type;

        static type pre(std::multimap<std::string,std::string>& )
        { 
            return intermediate_struct();
        }
        static void post(std::multimap<std::string,std::string>& map, intermediate_struct const& intermediate)
        {
            for(const auto& key_val : intermediate.data)
            {
                for(const auto& key : key_val.keys)
                {
                    for(const auto& val : key_val.values)
                    {
                        map.insert(typename std::multimap<std::string,std::string>::value_type(key,val));
                    }
                } 
            }
        }  
        static void fail(std::multimap<std::string,std::string>&){} 
    };

}}}

int main()
{
    std::string input = "{A [B C] -> F [D E], C ->E,B->Z}";
    std::string::const_iterator iter = input.begin(), end = input.end();

    std::multimap<std::string,std::string> sdmap;

    qi::rule<std::string::const_iterator,std::string(),ascii::space_type> text_rule =
        +qi::char_("a-zA-Z0-9") | qi::lexeme[('[' >> +qi::char_("a-zA-Z0-9 ") >> ']')];
    qi::rule<std::string::const_iterator,std::vector<std::string>(),ascii::space_type> keys_rule =
        +text_rule;
    qi::rule<std::string::const_iterator,std::vector<std::string>(),ascii::space_type> values_rule =
        +text_rule;
    qi::rule<std::string::const_iterator,intermediate_struct(),ascii::space_type> map_rule =
        qi::eps >> ('{' >> (keys_rule >> "->" >> values_rule)%',' >> '}');

    BOOST_SPIRIT_DEBUG_NODES( (map_rule)(keys_rule)(values_rule) );

    bool r = qi::phrase_parse(  iter, 
                            end,
                            map_rule,
                            ascii::space,
                            sdmap
                        );

    if(r && (iter == end)) {
        std::cout << "Parsing succeeded!" << std::endl;
        for(const auto& pair : sdmap) {
            std::cout << pair.first << ": " << pair.second << std::endl;
        }
    } else {
        std::cout << "Parsing Failed!" << std::endl;   
        std::cout << "Unparsed: " << std::string(iter,end) << std::endl;
    }

    return 0;
}
于 2013-09-03T07:36:28.623 回答