我正在为一种输入文件编写解析器。输入文件类似于:
[CalculationBlock]
CalculationTitle="Test Parser Input System" , MatchingRadius=25.0, StepSize=0.01,ProblemType=RelSchroedingerEqn
MaxPartialWaveJ=800, SMatConv=10E-8
PartialWaveConv= 10E-8, SmallValueLimit = 10E-8
PotentialRadType=HeavyIon
[end]
本质上,它分为以[BlockName]
开头的块,然后在其中包含一组命名参数。命名参数可以用','
或'\n'
个字符分隔。
使用我上面提到的不完整的输入文件,我想为它编写一个解析器,它将作为更完整输入文件的跳转点。我这样做但解析器有一个弱点,我不知道如何解决。它不是参数顺序独立的。例如,如果用户要将参数PartialWaveConv= 10E-8
放在SMatConv=10E-8
之前,则会失败。
我简单地考虑枚举一个块中参数的每个可能顺序,但我放弃了它,因为有n个参数值对的n!
个排列。 所以我的问题是:有没有办法让解析器独立于参数排序?
我写的玩具解析器如下,我道歉,如果它是业余的,这是我第一次进入boost
,更不用说boost.spirit
。
#include<string>
#include<iostream>
#include<cstdlib>
#include<fstream>
#include<boost/config/warning_disable.hpp>
#include<boost/spirit/include/qi.hpp>
#include<boost/spirit/include/phoenix_core.hpp>
#include<boost/spirit/include/phoenix_operator.hpp>
#include<boost/spirit/include/phoenix_object.hpp>
#include<boost/fusion/include/adapt_struct.hpp>
#include<boost/fusion/include/io.hpp>
#include<boost/spirit/include/support_istream_iterator.hpp>
namespace blocks
{
namespace qi = boost::spirit::qi;
namespace ascii = boost::spirit::ascii;
namespace phoenix = boost::phoenix;
struct CalcBlock
{
std::string calculationTitle;
float matchingRad;
float stepSize;
std::string problemType;
int maxPartialWaveJ;
float sMatrixConvergenceValue;
float partialWaveConvergenceValue;
float smallValueLimit;
std::string potentialRadType;
};
}
//tell fusion about the block structure
BOOST_FUSION_ADAPT_STRUCT(blocks::CalcBlock,
(std::string, calculationTitle)
(float, matchingRad)
(float, stepSize)
(std::string, problemType)
(int, maxPartialWaveJ)
(float, sMatrixConvergenceValue)
(float, partialWaveConvergenceValue)
(float, smallValueLimit)
(std::string, potentialRadType)
)
namespace blocks
{
template <typename Iterator>
struct CalcBlockParser : qi::grammar<Iterator, CalcBlock(), boost::spirit::ascii::blank_type>
{
CalcBlockParser() : CalcBlockParser::base_type(start)
{
using qi::int_;
using qi::lit;
using qi::float_;
using qi::lexeme;
using ascii::char_;
quotedString %= lexeme['"' >> +(char_ - '"' - '\n') >> '"'];
plainString %= lexeme[ +(char_ - ' ' - ',' - '\n') ];
start %=
lit("[CalculationBlock]") >> '\n'
>> lit("CalculationTitle") >> '=' >> quotedString >> (lit(',') | lit('\n'))
>> lit("MatchingRadius") >> '=' >> float_ >> (lit(',') | lit('\n'))
>> lit("StepSize") >> '=' >> float_ >> (lit(',') | lit('\n'))
>> lit("ProblemType") >> '=' >> plainString >> (lit(',') | lit('\n'))
>> lit("MaxPartialWaveJ") >> '=' >> int_ >> (lit(',') | lit('\n'))
>> lit("SMatConv") >> '=' >> float_ >> (lit(',') | lit('\n'))
>> lit("PartialWaveConv") >> '=' >> float_ >> (lit(',') | lit('\n'))
>> lit("SmallValueLimit") >> '=' >> float_ >> (lit(',') | lit('\n'))
>> lit("PotentialRadType") >> '=' >> plainString
>> lit("\n[end]\n");
}
qi::rule<Iterator, std::string(), boost::spirit::ascii::blank_type> quotedString;
qi::rule<Iterator, std::string(), boost::spirit::ascii::blank_type> plainString;
qi::rule<Iterator, CalcBlock(), boost::spirit::ascii::blank_type> start;
};
}
using std::cout;
using std::endl;
namespace spirit = boost::spirit;
int main(int argc, char *argv[])
{
if (argc != 2)
{
cout << "\nUsage:\n\t./echos InputFileName\n" << endl;
return EXIT_FAILURE;
}
std::string inputFileName(argv[1]);
cout << "Reading input from the file: " << inputFileName << endl;
std::ifstream input(inputFileName);
input.unsetf(std::ios::skipws);
spirit::istream_iterator start(input);
spirit::istream_iterator stop;
typedef blocks::CalcBlockParser<spirit::istream_iterator> CalcBlockParser;
CalcBlockParser cbParser;
blocks::CalcBlock cb;
bool success = phrase_parse(start, stop, cbParser, boost::spirit::ascii::blank, cb);
if (success && start == stop)
{
std::cout << boost::fusion::tuple_open('[');
std::cout << boost::fusion::tuple_close(']');
std::cout << boost::fusion::tuple_delimiter(", ");
std::cout << "-------------------------\n";
std::cout << "Parsing succeeded\n";
std::cout << "got: " << boost::fusion::as_vector(cb) << std::endl;
std::cout << "\n-------------------------\n";
}
else
{
std::cout << boost::fusion::tuple_open('[');
std::cout << boost::fusion::tuple_close(']');
std::cout << boost::fusion::tuple_delimiter(", ");
std::cout << "-------------------------\n";
std::cout << "Parsing failed\n";
std::cout << "got: " << boost::fusion::as_vector(cb) << std::endl;
std::cout << "\n-------------------------\n";
}
return EXIT_SUCCESS;
}
答案 0 :(得分:5)
为了好玩/完整,我查看了语法并提出了以下测试。
我已经做了一些左右改进的建议(正如OP在直播中见到的那样),结果代码,测试和输出都在这里:
<强> Live On Coliru 强>
#include <boost/fusion/include/adapt_struct.hpp>
#include <boost/spirit/include/qi.hpp>
#include <fstream>
#include <iostream>
namespace blocks {
struct CalcBlock {
std::string calculationTitle;
float matchingRad;
float stepSize;
std::string problemType;
int maxPartialWaveJ;
float sMatrixConvergenceValue;
float partialWaveConvergenceValue;
float smallValueLimit;
std::string potentialRadType;
};
}
BOOST_FUSION_ADAPT_STRUCT(blocks::CalcBlock, // Boost 1.58+ style adapt-struct
calculationTitle, matchingRad, stepSize, problemType, maxPartialWaveJ,
sMatrixConvergenceValue, partialWaveConvergenceValue, smallValueLimit,
potentialRadType)
namespace blocks {
namespace qi = boost::spirit::qi;
template <typename Iterator>
struct CalcBlockParser : qi::grammar<Iterator, CalcBlock()> {
CalcBlockParser() : CalcBlockParser::base_type(start) {
using namespace qi;
auto eol_ = copy((',' >> *eol) | +eol); // http://stackoverflow.com/a/26411266/85371 (!)
quotedString = '"' >> +~char_("\"\n") >> '"';
plainString = +~char_(" ,\n");
start = skip(blank) [cbRule];
cbRule = lexeme["[CalculationBlock]"] >> eol
>> (
(lexeme["CalculationTitle"] >> '=' >> quotedString >> eol_)
^ (lexeme["MatchingRadius"] >> '=' >> float_ >> eol_)
^ (lexeme["StepSize"] >> '=' >> float_ >> eol_)
^ (lexeme["ProblemType"] >> '=' >> plainString >> eol_)
^ (lexeme["MaxPartialWaveJ"] >> '=' >> int_ >> eol_)
^ (lexeme["SMatConv"] >> '=' >> float_ >> eol_)
^ (lexeme["PartialWaveConv"] >> '=' >> float_ >> eol_)
^ (lexeme["SmallValueLimit"] >> '=' >> float_ >> eol_)
^ (lexeme["PotentialRadType"] >> '=' >> plainString >> eol_)
)
>> lexeme["[end]"]
>> *eol
>> eoi;
}
private:
qi::rule<Iterator, CalcBlock()> start;
qi::rule<Iterator, CalcBlock(), qi::blank_type> cbRule;
// lexemes:
qi::rule<Iterator, std::string()> quotedString, plainString;
};
}
using boost::fusion::as_vector;
typedef boost::spirit::istream_iterator It;
int main(int argc, char **argv) {
if (argc != 2) {
std::cout << "Usage:\n\t" << argv[0] << " InputFileName" << std::endl;
return 1;
}
std::string inputFileName(argv[1]);
std::cout << "Reading input from the file: " << inputFileName << std::endl;
std::ifstream input(inputFileName);
input.unsetf(std::ios::skipws);
It start(input), stop;
blocks::CalcBlock cb;
blocks::CalcBlockParser<It> cbParser;
bool success = parse(start, stop, cbParser, cb);
{
using namespace boost::fusion;
std::cout << tuple_open('[') << tuple_close(']') << tuple_delimiter(", ");
}
std::cout << "-------------------------\n";
std::cout << "Parsing " << (success?"succeeded":"failed") << "\n";
std::cout << "got: " << as_vector(cb) << "\n";
std::cout << "-------------------------\n";
}
输入:
[CalculationBlock]
CalculationTitle="Test Parser Input System"
SMatConv=10E-8,
PartialWaveConv= 10E-8, MaxPartialWaveJ=800, SmallValueLimit = 10E-8
PotentialRadType=HeavyIon , MatchingRadius=25.0, StepSize=0.01,ProblemType=RelSchroedingerEqn
[end]
输出:
Reading input from the file: input.txt
-------------------------
Parsing succeeded
got: [Test Parser Input System, 25, 0.01, RelSchroedingerEqn, 800, 1e-07, 1e-07, 1e-07, HeavyIon]
-------------------------
答案 1 :(得分:3)
您必须使用排列运算符^
:
start %=
lit("[CalculationBlock]") >> '\n' >>
(
(lit("CalculationTitle") >> '=' >> quotedString >> (lit(',') | lit)('\n')))
^ (lit("MatchingRadius") >> '=' >> float_ >> (lit(',') | lit('\n')))
^ (lit("StepSize") >> '=' >> float_ >> (lit(',') | lit('\n')))
^ (lit("ProblemType") >> '=' >> plainString >> (lit(',') | lit('\n')))
^ (lit("MaxPartialWaveJ") >> '=' >> int_ >> (lit(',') | lit('\n')))
^ (lit("SMatConv") >> '=' >> float_ >> (lit(',') | lit('\n')))
^ (lit("PartialWaveConv") >> '=' >> float_ >> (lit(',') | lit('\n')))
^ (lit("SmallValueLimit") >> '=' >> float_ >> (lit(',') | lit('\n')))
^ (lit("PotentialRadType") >> '=' >> plainString >> (lit(',') | lit('\n')))
)
>> lit("\n[end]\n");