// Boost tokenizer examples -------------------------------------------------// // (c) Copyright John R. Bandela 2001. // Distributed under the Boost Software License, Version 1.0. (See // accompanying file LICENSE_1_0.txt or copy at // http://www.boost.org/LICENSE_1_0.txt) // See http://www.boost.org for updates, documentation, and revision history. #include #include #include #include #include #include #include int main() { using namespace boost; // Use tokenizer { const std::string test_string = ";;Hello|world||-foo--bar;yow;baz|"; std::string answer[] = { "Hello", "world", "foo", "bar", "yow", "baz" }; typedef tokenizer > Tok; char_separator sep("-;|"); Tok t(test_string, sep); BOOST_TEST(std::equal(t.begin(),t.end(),answer)); } { const std::string test_string = ";;Hello|world||-foo--bar;yow;baz|"; std::string answer[] = { "", "", "Hello", "|", "world", "|", "", "|", "", "foo", "", "bar", "yow", "baz", "|", "" }; typedef tokenizer > Tok; char_separator sep("-;", "|", boost::keep_empty_tokens); Tok t(test_string, sep); BOOST_TEST(std::equal(t.begin(), t.end(), answer)); } { const std::string test_string = "This,,is, a.test.."; std::string answer[] = {"This","is","a","test"}; typedef tokenizer<> Tok; Tok t(test_string); BOOST_TEST(std::equal(t.begin(),t.end(),answer)); } { const std::string test_string = "Field 1,\"embedded,comma\",quote \\\", escape \\\\"; std::string answer[] = {"Field 1","embedded,comma","quote \""," escape \\"}; typedef tokenizer > Tok; Tok t(test_string); BOOST_TEST(std::equal(t.begin(),t.end(),answer)); } { const std::string test_string = ",1,;2\\\";3\\;,4,5^\\,\'6,7\';"; std::string answer[] = {"","1","","2\"","3;","4","5\\","6,7",""}; typedef tokenizer > Tok; escaped_list_separator sep("\\^",",;","\"\'"); Tok t(test_string,sep); BOOST_TEST(std::equal(t.begin(),t.end(),answer)); } { const std::string test_string = "12252001"; std::string answer[] = {"12","25","2001"}; typedef tokenizer Tok; boost::array offsets = {{2,2,4}}; offset_separator func(offsets.begin(),offsets.end()); Tok t(test_string,func); BOOST_TEST(std::equal(t.begin(),t.end(),answer)); } // Use token_iterator_generator { const std::string test_string = "This,,is, a.test.."; std::string answer[] = {"This","is","a","test"}; typedef token_iterator_generator >::type Iter; Iter begin = make_token_iterator(test_string.begin(), test_string.end(),char_delimiters_separator()); Iter end; BOOST_TEST(std::equal(begin,end,answer)); } { const std::string test_string = "Field 1,\"embedded,comma\",quote \\\", escape \\\\"; std::string answer[] = {"Field 1","embedded,comma","quote \""," escape \\"}; typedef token_iterator_generator >::type Iter; Iter begin = make_token_iterator(test_string.begin(), test_string.end(),escaped_list_separator()); Iter begin_c(begin); Iter end; BOOST_TEST(std::equal(begin,end,answer)); while(begin_c != end) { BOOST_TEST(begin_c.at_end() == 0); ++begin_c; } BOOST_TEST(begin_c.at_end()); } { const std::string test_string = "12252001"; std::string answer[] = {"12","25","2001"}; typedef token_iterator_generator::type Iter; boost::array offsets = {{2,2,4}}; offset_separator func(offsets.begin(),offsets.end()); Iter begin = make_token_iterator(test_string.begin(), test_string.end(),func); Iter end= make_token_iterator(test_string.end(), test_string.end(),func); BOOST_TEST(std::equal(begin,end,answer)); } // Test copying { const std::string test_string = "abcdef"; token_iterator_generator::type beg, end, other; boost::array ar = {{1,2,3}}; offset_separator f(ar.begin(),ar.end()); beg = make_token_iterator(test_string.begin(),test_string.end(),f); ++beg; other = beg; ++other; BOOST_TEST(*beg=="bc"); BOOST_TEST(*other=="def"); other = make_token_iterator(test_string.begin(), test_string.end(),f); BOOST_TEST(*other=="a"); } // Test non-default constructed char_delimiters_separator { const std::string test_string = "how,are you, doing"; std::string answer[] = {"how",",","are you",","," doing"}; tokenizer<> t(test_string,char_delimiters_separator(true,",","")); BOOST_TEST(std::equal(t.begin(),t.end(),answer)); } return boost::report_errors(); }