Boost正则表达式,如何提取网页中所有加粗的文字?
要提取的内容如下:
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"><html xmlns="http://www.w3.org/1999/xhtml"><head><meta http-equiv="Content-Type" content="text/html; charset=gb2312" /><title>无标题文档</title></head><body><strong>1</strong> <strong>2</strong> <strong>safd</strong> sdfsf <strong>aaa</strong> bbb 23 <strong>2324</strong> acc</body></html>
<strong>(.*?)</strong>
[解决办法]
#include <boost/regex.hpp>

#include <iostream>
#include <string>

/// Prints the text enclosed by every <strong>...</strong> element of a sample
/// HTML fragment, one entry per line.
///
/// @return 0 on completion.
int main()
{
    // Non-greedy capture so each match stops at the nearest closing tag
    // instead of swallowing everything up to the last </strong>.
    const boost::regex reg("<strong>(.*?)</strong>");

    const std::string str =
        "<strong>1</strong> <strong>2</strong> <strong>safd</strong> sdfsf "
        "<strong>aaa</strong> bbb 23 <strong>2324</strong> acc";

    // A default-constructed regex iterator is the end-of-sequence sentinel.
    const boost::sregex_iterator end;
    for (boost::sregex_iterator iter(str.begin(), str.end(), reg); iter != end; ++iter) {
        // Sub-match 0 is the whole match including the tags; sub-match 1 is
        // the capture group, i.e. only the bold text that was asked for.
        std::cout << iter->str(1) << '\n';
    }

    return 0;
}