#include #include int main(void) { boost::make_u32regex("\xed\xa0\x80"); // single lowest lead surrogate U+D800 boost::make_u32regex("\xed\xaf\xbf"); // single highest lead surrogate U+DBFF boost::make_u32regex("\xed\xb0\x80"); // single lowest trail surrogate U+DC00 boost::make_u32regex("\xed\xbf\xbf"); // single highest trail surrogate U+DFFF // overlong encodings (created by left-padding with zero bits) boost::make_u32regex("\xc0\x80"); // illegal 2-byte encoding of 1-byte character U+0000 boost::make_u32regex("\xe0\x80\x80"); // illegal 3-byte encoding of 1-byte character U+0000 boost::make_u32regex("\xf0\x80\x80\x80"); // illegal 4-byte encoding of 1-byte character U+0000 boost::make_u32regex("\xc1\xbf"); // illegal 2-byte encoding of 1-byte character U+007F boost::make_u32regex("\xe0\x81\xbf"); // illegal 3-byte encoding of 1-byte character U+007F boost::make_u32regex("\xf0\x80\x81\xbf"); // illegal 4-byte encoding of 1-byte character U+007F boost::make_u32regex("\xe0\x82\x80"); // illegal 3-byte encoding of 2-byte character U+0080 boost::make_u32regex("\xf0\x80\x82\x80"); // illegal 4-byte encoding of 2-byte character U+0080 boost::make_u32regex("\xe0\x9f\xbf"); // illegal 3-byte encoding of 2-byte character U+07FF boost::make_u32regex("\xf0\x80\x9f\xbf"); // illegal 4-byte encoding of 2-byte character U+07FF boost::make_u32regex("\xf0\x80\xa0\x80"); // illegal 4-byte encoding of 3-byte character U+0800 boost::make_u32regex("\xf0\x8f\xbf\xbf"); // illegal 4-byte encoding of 3-byte character U+FFFF return 0; }