我的程序無法識別中文。如何用 Boost Spirit 來識別中文?我使用 wstring,
並將其轉換爲 UTF-16。如何使用 Boost Spirit 解析中文(Unicode UTF-16)?
這裏是我的頭文件:
#pragma once
#define BOOST_SPIRIT_UNICODE
#include <boost/spirit/include/qi.hpp>
#include <string>
#include <vector>
#include <map>
using namespace std;
namespace qi = boost::spirit::qi;
namespace ascii = boost::spirit::ascii;
// Attribute types produced by the WordPaser grammar.
// Names are fully qualified so these aliases do not depend on a
// using-directive being in effect at header scope.

// One (part, meaning) entry: `first` receives the mRuleWordPart text,
// `second` receives the mRuleWordMeaning text.
typedef std::pair<std::wstring, std::wstring> WordMeaningType;

// All (part, meaning) entries collected for a single word.
typedef std::vector<WordMeaningType> WordMeaningsType;

// A word (`first`, the mRuleWord text) together with its entries (`second`).
typedef std::pair<std::wstring, WordMeaningsType> WordType;

// The complete parse result: every word in input order.
typedef std::vector<WordType> WordListType;
// Qi grammar over std::wstring iterators whose synthesized attribute is a
// WordListType. The grammar and every rule share ascii::space_type as their
// skipper type. Only declarations live here; the rules are given their
// definitions in the constructor.
struct WordPaser
    : qi::grammar<std::wstring::iterator, WordListType(), ascii::space_type>
{
    // Rules that synthesize plain text.
    qi::rule<std::wstring::iterator, std::wstring(), ascii::space_type> mRuleWordPart;
    qi::rule<std::wstring::iterator, std::wstring(), ascii::space_type> mRuleWordMeaning;
    qi::rule<std::wstring::iterator, std::wstring(), ascii::space_type> mRuleWord;

    // Rules that synthesize the composite attribute types.
    qi::rule<std::wstring::iterator, WordMeaningType(), ascii::space_type> mRulePM;
    qi::rule<std::wstring::iterator, WordMeaningsType(), ascii::space_type> mRulePMs;
    qi::rule<std::wstring::iterator, WordType(), ascii::space_type> mRuleCurWPM;
    qi::rule<std::wstring::iterator, WordListType(), ascii::space_type> mRuleEntrence;

    // Value members mirroring the rule attribute types.
    // NOTE(review): nothing in this declaration uses them — confirm whether
    // any caller still needs them.
    std::wstring mCurWord;
    std::wstring mCurWordPart;
    std::wstring mCurWordMeaning;
    WordMeaningType mCurPM;
    WordMeaningsType mCurPMs;
    WordType mCurWPM;

    // Declared here, defined out of line.
    WordPaser();
};
這是我的 CPP 文件:
#include <boost/tuple/tuple.hpp>
#include <boost/spirit/include/qi.hpp>
#include <boost/spirit/include/phoenix.hpp>
#include "WordPaser.h"
namespace fusion = boost::fusion;
namespace phoenix = boost::phoenix;
using qi::_val;
using qi::_1;
using qi::_2;
using qi::lit;
using qi::lexeme;
using qi::space;
using ascii::char_;
using ascii::string;
using qi::graph;
using qi::word;
// Defines every rule of the grammar and registers mRuleEntrence as the start
// rule.
//
// Grammar shape:
//   mRuleEntrence    := one or more mRuleCurWPM
//   mRuleCurWPM      := mRuleWord followed by mRulePMs
//   mRulePMs         := one or more mRulePM
//   mRulePM          := mRuleWordPart followed by mRuleWordMeaning
//   mRuleWord        := letters, then any run of letters / '(' / ')'
//   mRuleWordPart    := letters, then any run of letters / '/' / '.'
//   mRuleWordMeaning := one or more graphic (visible, non-space) wide characters
//
// The three text rules are wrapped in lexeme[] so the skipper does not run
// inside a token. Each of them also writes a trace marker plus the matched
// character to std::wcout while parsing.
WordPaser::WordPaser()
: WordPaser::base_type(mRuleEntrence)
{
    // Wide-character encoding for classifying wchar_t input. Classification is
    // delegated to the C library's wide-character functions, so it follows the
    // current C locale.
    // NOTE(review): if CJK text is still rejected on your platform, confirm a
    // suitable locale is installed (e.g. via std::setlocale) before parsing.
    namespace wide = boost::spirit::standard_wide;

    // The stream is wrapped in phoenix::ref so the whole `<<` chain is lazy.
    // Written as `std::wcout << L'|' << _1`, the first `<<` would run
    // immediately, printing the marker once while the grammar is constructed
    // instead of once per matched character.
    //
    // mRuleWord / mRuleWordPart keep the narrow qi::alpha classifier, so they
    // continue to match only letters representable in the narrow range.
    mRuleWord %= lexeme[
        +(qi::alpha[phoenix::ref(std::wcout) << L'|' << _1])
        >> *(qi::alpha | char_('(') | char_(')'))
    ];

    mRuleWordPart %= lexeme[
        +(qi::alpha[phoenix::ref(std::wcout) << L'@' << _1])
        >> *((qi::alpha | char_('/') | char_('.'))[phoenix::ref(std::wcout) << L'@' << _1])
    ];

    // The meaning text is where non-Latin characters appear. A narrow
    // classifier cannot match code units outside the char range, so the wide
    // one is used. Parentheses are already graphic characters, so the former
    // '(' / ')' alternatives were unreachable and are dropped; the trace now
    // applies to every matched character rather than to an unreachable branch.
    mRuleWordMeaning %= lexeme[
        +(wide::graph[phoenix::ref(std::wcout) << L':' << _1])
    ];

    // Part -> pair.first, meaning -> pair.second.
    mRulePM = (mRuleWordPart >> mRuleWordMeaning)
    [
        phoenix::bind(&WordMeaningType::first, _val) = _1,
        phoenix::bind(&WordMeaningType::second, _val) = _2
    ];

    // Append each (part, meaning) pair to the list attribute.
    mRulePMs = +(mRulePM
    [
        phoenix::push_back(_val, _1)
    ]);

    // Word -> pair.first, its list of pairs -> pair.second.
    mRuleCurWPM = (mRuleWord >> mRulePMs)
    [
        phoenix::bind(&WordType::first, _val) = _1,
        phoenix::bind(&WordType::second, _val) = _2
    ];

    // Append each parsed word entry to the overall result.
    mRuleEntrence = +mRuleCurWPM
    [
        phoenix::push_back(_val, _1)
    ];
}
請至少提供樣本輸入和預期輸出。目前這裏並沒有一個明確的問題。 – sehe 2012-03-25 20:38:06