test_icu.cpp

来自「Boost provides free peer-reviewed portab」· C++ 代码 · 共 650 行 · 第 1/2 页

CPP
650
字号
/*
 *
 * Copyright (c) 2004
 * John Maddock
 *
 * Use, modification and distribution are subject to the
 * Boost Software License, Version 1.0. (See accompanying file
 * LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
 *
 */

 /*
  *   LOCATION:    see http://www.boost.org for most recent version.
  *   FILE         test_icu.cpp
  *   VERSION      see <boost/version.hpp>
  *   DESCRIPTION: Test code for Unicode regexes with ICU support.
  */

//
// We can only build this if we have ICU support:
//
#include <boost/regex/config.hpp>
#if defined(BOOST_HAS_ICU) && !defined(BOOST_NO_STD_WSTRING)

#include <boost/regex/icu.hpp>
#include "test.hpp"

namespace unnecessary_fix{
//
// Some outrageously broken std lib's don't have a conforming
// back_insert_iterator, which means we can't use the std version
// as an argument to regex_replace, sigh... use our own:
//
// Minimal output iterator that appends to a sequence.
//    Seq - container type; must provide value_type and push_back().
// Assigning through the iterator calls container->push_back(val).
// Dereference and both increment forms do nothing except hand back the
// iterator, so the usual "*it++ = value" idiom ends up in operator=.
// The std::iterator base is only used when BOOST_NO_STD_ITERATOR is
// not defined.
//
template <class Seq>
class back_insert_iterator
#ifndef BOOST_NO_STD_ITERATOR
   : public std::iterator<std::output_iterator_tag,void,void,void,void>
#endif
{
private:
   // Non-owning pointer to the sequence being appended to.
   Seq* container;
public:
   typedef const typename Seq::value_type value_type;
   typedef Seq                  container_type;
   typedef std::output_iterator_tag  iterator_category;

   // Bind the iterator to x; x must outlive the iterator since only
   // its address is stored.
   explicit back_insert_iterator(Seq& x) : container(&x) {}
   // Append val to the bound sequence.
   back_insert_iterator& operator=(const value_type& val)
   {
      container->push_back(val);
      return *this;
   }
   // No-ops required by the output iterator interface:
   back_insert_iterator& operator*() { return *this; }
   back_insert_iterator& operator++() { return *this; }
   back_insert_iterator  operator++(int) { return *this; }
};

//
// Convenience factory: returns a back_insert_iterator<Seq> bound to x,
// letting Seq be deduced from the argument.
//
template <class Seq>
inline back_insert_iterator<Seq> back_inserter(Seq& x)
{
   return back_insert_iterator<Seq>(x);
}

}

//
// compare two match_results struct's for equality,
// converting the iterator as needed:
//
// This overload is selected by passing a null "boost::mpl::int_<2> const*"
// as the third argument; it wraps w2's iterators in
// boost::u16_to_u32_iterator before measuring distances.
//    w1 - reference result.
//    w2 - result to check; its sub-match iterators are adapted so that
//         offsets are counted in steps of the converting iterator
//         (presumably UTF-32 code points -- the adaptor is defined in
//         Boost.Regex, not in this file).
// Reported through BOOST_REGEX_TEST_ERROR:
//    * w1.size() != w2.size();
//    * sub-expression i matched in one result but not in the other;
//    * for a matched sub-expression, w1.position(i) differs from the
//      distance between the start of w2's prefix and the start of
//      w2[i], or w1.length(i) differs from the distance spanned by w2[i].
// Note that the loop still runs over w1.size() entries after a size
// mismatch has been reported (no early exit is visible here).
//
template <class MR1, class MR2>
void compare_result(const MR1& w1, const MR2& w2, boost::mpl::int_<2> const*)
{
   typedef typename MR2::value_type MR2_value_type;
   typedef typename MR2_value_type::const_iterator MR2_iterator_type;
   typedef boost::u16_to_u32_iterator<MR2_iterator_type> iterator_type;
   // NOTE(review): size_type is declared but not used in this function.
   typedef typename MR1::size_type size_type;
   if(w1.size() != w2.size())
   {
      BOOST_REGEX_TEST_ERROR("Size mismatch in match_results class", UChar32);
   }
   for(int i = 0; i < (int)w1.size(); ++i)
   {
      if(w1[i].matched)
      {
         if(w2[i].matched == 0)
         {
            BOOST_REGEX_TEST_ERROR("Matched mismatch in match_results class", UChar32);
         }
         // Position is measured from the start of w2's prefix, length
         // across the sub-match itself, both via the converting iterator:
         if((w1.position(i) != boost::re_detail::distance(iterator_type(w2.prefix().first), iterator_type(w2[i].first)))
            || (w1.length(i) != boost::re_detail::distance(iterator_type(w2[i].first), iterator_type(w2[i].second))))
         {
            BOOST_REGEX_TEST_ERROR("Iterator mismatch in match_results class", UChar32);
         }
      }
      else if(w2[i].matched)
      {
         BOOST_REGEX_TEST_ERROR("Matched mismatch in match_results class", UChar32);
      }
   }
}
//
// Same comparison as the int_<2> overload, but selected with a null
// "boost::mpl::int_<1> const*" and adapting w2's iterators with
// boost::u8_to_u32_iterator instead.
//    w1 - reference result.
//    w2 - result to check, measured through the converting iterator.
// Size, matched-flag and position/length mismatches are reported
// through BOOST_REGEX_TEST_ERROR exactly as in the other overload.
//
template <class MR1, class MR2>
void compare_result(const MR1& w1, const MR2& w2, boost::mpl::int_<1> const*)
{
   typedef typename MR2::value_type MR2_value_type;
   typedef typename MR2_value_type::const_iterator MR2_iterator_type;
   typedef boost::u8_to_u32_iterator<MR2_iterator_type> iterator_type;
   // NOTE(review): size_type is declared but not used in this function.
   typedef typename MR1::size_type size_type;
   if(w1.size() != w2.size())
   {
      BOOST_REGEX_TEST_ERROR("Size mismatch in match_results class", UChar32);
   }
   for(int i = 0; i < (int)w1.size(); ++i)
   {
      if(w1[i].matched)
      {
         if(w2[i].matched == 0)
         {
            BOOST_REGEX_TEST_ERROR("Matched mismatch in match_results class", UChar32);
         }
         // Position is measured from the start of w2's prefix, length
         // across the sub-match itself, both via the converting iterator:
         if((w1.position(i) != boost::re_detail::distance(iterator_type(w2.prefix().first), iterator_type(w2[i].first)))
            || (w1.length(i) != boost::re_detail::distance(iterator_type(w2[i].first), iterator_type(w2[i].second))))
         {
            BOOST_REGEX_TEST_ERROR("Iterator mismatch in match_results class", UChar32);
         }
      }
      else if(w2[i].matched)
      {
         BOOST_REGEX_TEST_ERROR("Matched mismatch in match_results class", UChar32);
      }
   }
}

//
// Walk every match of r in search_text with a u32regex_iterator and
// check each one:
//    * a copy of the iterator, advanced in lock-step, must compare
//      equal to it (both != and == are exercised);
//    * test_result() is called with the match, the start of the text
//      and the current position in the answer table;
//    * the prefix ($`) must run from the end of the previous match (the
//      start of the text for the first match) to the start of this match;
//    * the suffix ($') must run from the end of this match to the end
//      of the text;
//    * the "matched" flag of prefix and suffix must be true exactly
//      when the corresponding range is non-empty.
// Match options and the answer table are taken from test_info<wchar_t>;
// failures are reported through BOOST_REGEX_TEST_ERROR.
//
void test_icu_grep(const boost::u32regex& r, const std::vector< ::UChar32>& search_text)
{
   typedef std::vector< ::UChar32>::const_iterator const_iterator;
   typedef boost::u32regex_iterator<const_iterator> test_iterator;
   boost::regex_constants::match_flag_type opts = test_info<wchar_t>::match_options();
   const int* answer_table = test_info<wchar_t>::answer_table();
   // "end" is default constructed and serves as the end-of-sequence iterator.
   test_iterator start(search_text.begin(), search_text.end(), r, opts), end;
   test_iterator copy(start);
   // End of the previous match; the next prefix is expected to start here.
   const_iterator last_end = search_text.begin();
   while(start != end)
   {
      if(start != copy)
      {
         BOOST_REGEX_TEST_ERROR("Failed iterator != comparison.", wchar_t);
      }
      if(!(start == copy))
      {
         BOOST_REGEX_TEST_ERROR("Failed iterator == comparison.", wchar_t);
      }
      test_result(*start, search_text.begin(), answer_table);
      // test $` and $' :
      if(start->prefix().first != last_end)
      {
         BOOST_REGEX_TEST_ERROR("Incorrect position for start of $`", wchar_t);
      }
      if(start->prefix().second != (*start)[0].first)
      {
         BOOST_REGEX_TEST_ERROR("Incorrect position for end of $`", wchar_t);
      }
      if(start->prefix().matched != (start->prefix().first != start->prefix().second))
      {
         BOOST_REGEX_TEST_ERROR("Incorrect position for matched member of $`", wchar_t);
      }
      if(start->suffix().first != (*start)[0].second)
      {
         BOOST_REGEX_TEST_ERROR("Incorrect position for start of $'", wchar_t);
      }
      if(start->suffix().second != search_text.end())
      {
         BOOST_REGEX_TEST_ERROR("Incorrect position for end of $'", wchar_t);
      }
      if(start->suffix().matched != (start->suffix().first != start->suffix().second))
      {
         BOOST_REGEX_TEST_ERROR("Incorrect position for matched member of $'", wchar_t);
      }
      last_end = (*start)[0].second;
      ++start;
      ++copy;
      // move on the answer table to next set of answers;
      // (unless already sitting on a -2 entry, advance to just past the
      // next -2 entry)
      if(*answer_table != -2)
         while(*answer_table++ != -2){}
   }
   // A non-negative entry left in the table means another match was expected.
   if(answer_table[0] >= 0)
   {
      // we should have had a match but didn't:
      BOOST_REGEX_TEST_ERROR("Expected match was not found.", wchar_t);
   }
}

//
// Search test driven by the data in test_info<wchar_t>: the current
// expression is compiled into a u32regex from a vector of UChar32, the
// current text is searched and the result handed to test_result().
// When no test locale is set, the same search is then repeated with
// UTF-16 and UTF-8 encoded copies of the expression and text, and each
// result is checked against the UTF-32 one with compare_result().
// Both parameters are unnamed and not used in the code visible here
// (presumably they only select this overload -- confirm against callers).
//
void test_icu(const wchar_t&, const test_regex_search_tag& )
{
   boost::u32regex r;
   if(*test_locale::c_str())
   {
      U_NAMESPACE_QUALIFIER Locale l(test_locale::c_str());
      // Give up silently if the locale object reports itself as bogus:
      if(l.isBogus())
         return;
      r.imbue(l);
   }

   std::vector< ::UChar32> expression;
#ifndef BOOST_NO_TEMPLATED_ITERATOR_CONSTRUCTORS
   expression.assign(test_info<wchar_t>::expression().begin(), test_info<wchar_t>::expression().end());
#else
   std::copy(test_info<wchar_t>::expression().begin(), test_info<wchar_t>::expression().end(), std::back_inserter(expression));
#endif
   // NOTE(review): syntax options are read from test_info<UChar32> while
   // everything else here uses test_info<wchar_t> -- confirm this is intended.
   boost::regex_constants::syntax_option_type syntax_options = test_info<UChar32>::syntax_options();
   try{
#if !defined(BOOST_NO_MEMBER_TEMPLATES) && !defined(__IBMCPP__)
      r.assign(expression.begin(), expression.end(), syntax_options);
#else
      // Pointer + length form; an empty expression is passed as a null pointer.
      if(expression.size())
         r.assign(&*expression.begin(), expression.size(), syntax_options);
      else
         r.assign(static_cast<UChar32 const*>(0), expression.size(), syntax_options);
#endif
      if(r.status())
      {
         BOOST_REGEX_TEST_ERROR("Expression did not compile when it should have done, error code = " << r.status(), UChar32);
      }
      std::vector< ::UChar32> search_text;
#ifndef BOOST_NO_TEMPLATED_ITERATOR_CONSTRUCTORS
      search_text.assign(test_info<wchar_t>::search_text().begin(), test_info<wchar_t>::search_text().end());
#else
      std::copy(test_info<wchar_t>::search_text().begin(), test_info<wchar_t>::search_text().end(), std::back_inserter(search_text));
#endif
      boost::regex_constants::match_flag_type opts = test_info<wchar_t>::match_options();
      const int* answer_table = test_info<wchar_t>::answer_table();
      boost::match_results<std::vector< ::UChar32>::const_iterator> what;
      // The const_casts force the const overloads of begin()/end() so the
      // iterator type agrees with match_results<...::const_iterator>.
      if(boost::u32regex_search(
         const_cast<std::vector< ::UChar32>const&>(search_text).begin(),
         const_cast<std::vector< ::UChar32>const&>(search_text).end(),
         what,
         r,
         opts))
      {
         test_result(what, const_cast<std::vector< ::UChar32>const&>(search_text).begin(), answer_table);
      }
      else if(answer_table[0] >= 0)
      {
         // we should have had a match but didn't:
         BOOST_REGEX_TEST_ERROR("Expected match was not found.", UChar32);
      }

      // The re-encoded variants below only run when no test locale is set.
      if(0 == *test_locale::c_str())
      {
         //
         // Now try UTF-16 construction:
         //
         typedef boost::u32_to_u16_iterator<std::vector<UChar32>::const_iterator> u16_conv;
         std::vector<UChar> expression16, text16;
         boost::match_results<std::vector<UChar>::const_iterator> what16;
         boost::match_results<const UChar*> what16c;
#ifndef BOOST_NO_TEMPLATED_ITERATOR_CONSTRUCTORS
         expression16.assign(u16_conv(expression.begin()), u16_conv(expression.end()));
         text16.assign(u16_conv(search_text.begin()), u16_conv(search_text.end()));
#else
         expression16.clear();
         std::copy(u16_conv(expression.begin()), u16_conv(expression.end()), std::back_inserter(expression16));
         text16.clear();
         std::copy(u16_conv(search_text.begin()), u16_conv(search_text.end()), std::back_inserter(text16));
#endif
         r = boost::make_u32regex(expression16.begin(), expression16.end(), syntax_options);
         if(boost::u32regex_search(const_cast<const std::vector<UChar>&>(text16).begin(), const_cast<const std::vector<UChar>&>(text16).end(), what16, r, opts))
         {
            compare_result(what, what16, static_cast<boost::mpl::int_<2> const*>(0));
         }
         else if(answer_table[0] >= 0)
         {
            // we should have had a match but didn't:
            BOOST_REGEX_TEST_ERROR("Expected match was not found.", UChar32);
         }
         // The null-terminated pointer overloads are only exercised when
         // neither expression nor text already contains a zero element:
         if(std::find(expression16.begin(), expression16.end(), 0) == expression16.end())
         {
            expression16.push_back(0);
            r = boost::make_u32regex(&*expression16.begin(), syntax_options);
            if(std::find(text16.begin(), text16.end(), 0) == text16.end())
            {
               text16.push_back(0);
               if(boost::u32regex_search((const UChar*)&*text16.begin(), what16c, r, opts))
               {
                  compare_result(what, what16c, static_cast<boost::mpl::int_<2> const*>(0));
               }
               else if(answer_table[0] >= 0)
               {
                  // we should have had a match but didn't:
                  BOOST_REGEX_TEST_ERROR("Expected match was not found.", UChar32);
               }
            }
         }
         //
         // Now try UTF-8 construction:
         //
         typedef boost::u32_to_u8_iterator<std::vector<UChar32>::const_iterator, unsigned char> u8_conv;
         std::vector<unsigned char> expression8, text8;
         boost::match_results<std::vector<unsigned char>::const_iterator> what8;
         boost::match_results<const unsigned char*> what8c;
#ifndef BOOST_NO_TEMPLATED_ITERATOR_CONSTRUCTORS
         expression8.assign(u8_conv(expression.begin()), u8_conv(expression.end()));
         text8.assign(u8_conv(search_text.begin()), u8_conv(search_text.end()));
#else
         expression8.clear();
         std::copy(u8_conv(expression.begin()), u8_conv(expression.end()), std::back_inserter(expression8));
         text8.clear();
         std::copy(u8_conv(search_text.begin()), u8_conv(search_text.end()), std::back_inserter(text8));
#endif
         r = boost::make_u32regex(expression8.begin(), expression8.end(), syntax_options);
         if(boost::u32regex_search(const_cast<const std::vector<unsigned char>&>(text8).begin(), const_cast<const std::vector<unsigned char>&>(text8).end(), what8, r, opts))
         {
            compare_result(what, what8, static_cast<boost::mpl::int_<1> const*>(0));
         }
         else if(answer_table[0] >= 0)
         {
            // we should have had a match but didn't:
            BOOST_REGEX_TEST_ERROR("Expected match was not found.", UChar32);
         }
         // Same null-terminated pointer variant as for UTF-16 above:
         if(std::find(expression8.begin(), expression8.end(), 0) == expression8.end())
         {
            expression8.push_back(0);
            r = boost::make_u32regex(&*expression8.begin(), syntax_options);
            if(std::find(text8.begin(), text8.end(), 0) == text8.end())
            {
               text8.push_back(0);
               if(boost::u32regex_search((const unsigned char*)&*text8.begin(), what8c, r, opts))
               {

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?