etk/test/testRegExp.cpp

194 lines
6.5 KiB
C++
Raw Normal View History

/**
* @author Edouard DUPIN
*
* @copyright 2011, Edouard DUPIN, all right reserved
*
* @license MPL v2.0 (see license file)
*/
#include <etest/etest.hpp>
2017-08-22 21:20:43 +02:00
#include <etk/RegEx.hpp>
#include <test-debug/debug.hpp>
#define NAME "Hash"
2017-08-28 00:02:11 +02:00
/**
 * @brief Compile a regular expression, run it once over a string and log the outcome.
 * @param[in] _expression Pattern handed to the etk::RegEx constructor.
 * @param[in] _search Text that is parsed from offset 0 up to _search.size().
 * @return (start, stop) as reported by the RegEx when parse() succeeds, (0,0) otherwise.
 * @note A failed search is reported as (0,0); callers cannot tell it apart from a
 *       match that would itself be reported as [0..0].
 */
etk::Pair<int32_t, int32_t> testRegExSingle(const etk::String& _expression, const etk::String& _search) {
	etk::RegEx<etk::String> expression(_expression);
	TK_INFO("Parse RegEx: \"" << expression.getRegExDecorated() << "\"");
	TK_INFO(" IN: \"" << etk::regex::autoStr(_search) << "\"");
	if (expression.parse(_search, 0, _search.size()) == true) {
		TK_INFO(" match [" << expression.start() << ".." << expression.stop() << "] ");
		// Log the matched sub-string: it starts at start() and is (stop() - start()) characters long.
		TK_INFO(" ==> '" << etk::regex::autoStr(etk::String(_search, expression.start(), expression.stop() - expression.start())) << "'");
		return etk::makePair(expression.start(), expression.stop());
	}
	// No match: log a separator and return the (0,0) sentinel.
	TK_INFO(" ==> ---------------");
	return etk::makePair(0,0);
}
2017-08-28 00:02:11 +02:00
static etk::String data1 = " a /* plop */ \n int eee = 22; // error value \nint main(void) {\n return 0;\n}\n";
static etk::String data2 = "alpha /* plop */ test";
static etk::String data3 = "pp \n // qdfqdfsdf \nde";
2017-08-22 21:20:43 +02:00
/**
 * @brief Search a complete block comment (opener, any content, closer) in the shared inputs.
 */
TEST(TestEtkRegEx, MultipleLineComment) {
	etk::String expression = "/\\*.*\\*/";
	etk::Pair<int32_t, int32_t> res;
	// data1: the comment "/* plop */" is expected at [3..13].
	res = testRegExSingle(expression, data1);
	EXPECT_EQ(res, etk::makePair(3,13));
	// data2: the comment "/* plop */" is expected at [6..16].
	res = testRegExSingle(expression, data2);
	EXPECT_EQ(res, etk::makePair(6,16));
	// data3 has no block comment: the helper returns its (0,0) "no match" value.
	res = testRegExSingle(expression, data3);
	EXPECT_EQ(res, etk::makePair(0,0));
}
2017-08-22 21:20:43 +02:00
/**
 * @brief Search a "//" comment terminated by the '$' anchor in the shared inputs.
 */
TEST(TestEtkRegEx, MultipleEndDollar) {
	etk::String expression = "//.*$";
	etk::Pair<int32_t, int32_t> res;
	// data1: the "// error value " comment is expected at [30..46].
	res = testRegExSingle(expression, data1);
	EXPECT_EQ(res, etk::makePair(30,46));
	// data2 has no "//" sequence: the helper returns its (0,0) "no match" value.
	res = testRegExSingle(expression, data2);
	EXPECT_EQ(res, etk::makePair(0,0));
	// data3: the "// qdfqdfsdf " comment is expected at [5..19].
	res = testRegExSingle(expression, data3);
	EXPECT_EQ(res, etk::makePair(5,19));
}
2017-08-22 21:20:43 +02:00
/**
 * @brief Search a block-comment opener followed by an unterminated ".*".
 *
 * The expected ranges are only 2 characters wide, i.e. just the opener itself.
 */
TEST(TestEtkRegEx, MultipleNoEnd) {
	etk::String expression = "/\\*.*";
	etk::Pair<int32_t, int32_t> res;
	// data1: only the opener at [3..5] is expected.
	res = testRegExSingle(expression, data1);
	EXPECT_EQ(res, etk::makePair(3,5));
	// data2: only the opener at [6..8] is expected.
	res = testRegExSingle(expression, data2);
	EXPECT_EQ(res, etk::makePair(6,8));
	// data3 has no block-comment opener: the helper returns its (0,0) "no match" value.
	res = testRegExSingle(expression, data3);
	EXPECT_EQ(res, etk::makePair(0,0));
}
2017-08-22 21:20:43 +02:00
/**
 * @brief Search a single lower-case letter with a character range.
 */
TEST(TestEtkRegEx, aToZ) {
	etk::String expression = "[a-z]";
	etk::Pair<int32_t, int32_t> res;
	// data1 starts with a space: the first letter is expected at [1..2].
	res = testRegExSingle(expression, data1);
	EXPECT_EQ(res, etk::makePair(1,2));
	// data2 starts with a letter: expected at [0..1].
	res = testRegExSingle(expression, data2);
	EXPECT_EQ(res, etk::makePair(0,1));
	// data3 starts with a letter: expected at [0..1].
	res = testRegExSingle(expression, data3);
	EXPECT_EQ(res, etk::makePair(0,1));
}
2017-08-22 21:20:43 +02:00
/**
 * @brief Search a pattern mixing ".*", a repeated group, a bounded repeat "{2,3}" and alternation.
 */
TEST(TestEtkRegEx, complexString) {
	etk::String expression = "a.*plop(z{2,3}|h+)+r";
	etk::String dataToParse = " eesd a lzzml plophzzzzzhhhhhrlkmlkml";
	etk::Pair<int32_t, int32_t> res;
	res = testRegExSingle(expression, dataToParse);
	EXPECT_EQ(res, etk::makePair(7,31));
}
2017-08-22 21:20:43 +02:00
/**
 * @brief Search a word ending with '_' enclosed by the "\@" token when the text holds several '_'.
 */
TEST(TestEtkRegEx, multipleUnderscore) {
	etk::String expression = "\\@\\w+_\\@";
	etk::String dataToParse = " aaa_bbb_ plop_ ";
	etk::Pair<int32_t, int32_t> res;
	res = testRegExSingle(expression, dataToParse);
	EXPECT_EQ(res, etk::makePair(2,10));
}
2017-08-22 21:20:43 +02:00
/**
 * @brief Search a numeric literal that ends exactly at the end of the parsed data.
 */
TEST(TestEtkRegEx, endError) {
	etk::String expression = "\\@((0(x|X)[0-9a-fA-F]*)|(\\d+\\.?\\d*|\\.\\d+)((e|E)(\\+|\\-)?\\d+)?)(LL|L|l|UL|ul|u|U|F|f)?\\@";
	etk::String dataToParse = "(95";
	etk::Pair<int32_t, int32_t> res;
	res = testRegExSingle(expression, dataToParse);
	// The input is only 3 characters long, so the range [7..31] that was expected here
	// before (the same values as in complexString) could never be returned.
	// The numeric literal "95" occupies [1..3].
	// NOTE(review): assumes the trailing "\@" also matches at the very end of the data
	// (no character after "95") - confirm against the RegEx implementation.
	EXPECT_EQ(res, etk::makePair(1,3));
}
2017-08-22 21:20:43 +02:00
void testRegEx() {
2017-08-28 00:02:11 +02:00
etk::String data;
2017-08-28 00:02:11 +02:00
//etk::String data = "pp \n# plop // qdfqdfsdf \nde";
//etk::String data = "pp \n# plop //\\\n qdfqdfsdf \nde";
//etk::String data = "p#\ne";
2017-08-22 21:20:43 +02:00
//testRegExSingle("#(\\\\\\\\|\\\\\\n|.)*$", data);
//testRegExSingle("#.*$", data);
2017-08-28 00:02:11 +02:00
//etk::String data = "p//TODO:\ndse";
//etk::String data = "p// TODO:\ndse";
//etk::String data = "p// TODO :\ndse";
//etk::String data = "p// TODO : sdfgsdfsd \ndse";
2017-08-22 21:20:43 +02:00
//testRegExSingle("//[ \\t]*TODO[ \\t]*:.*$", data);
data = "abc m_def ghi";
data = " protected:\n"
" vec2 m_offset; \n";
2017-08-22 21:20:43 +02:00
//testRegExSingle("\\@m_[A-Za-z_0-9]*\\@", data);
data = " * @param[in] _mode Configuring mode.\n"
" * @param[in] _time Time in second of the annimation display\n"
" */\n"
" void setAnnimationTime(enum ";
data = "virtual vec2 relativePosition(const vec2& _pos);";
2017-08-22 21:20:43 +02:00
//testRegExSingle("\\@(\\w|_)+[ \\t]*\\(", data);
data = "include <ewol/Dimensio2n.h>\n"
"#include <ewol/Dimension.h>\n"
"'dfgd\'fg'\n"
"\"dqf\\\"gsdfg\" // \"\n"
"// TODO : sqdkfjsdldkqfj\n"
"\n"
"namespace ewol {\n"
" class Widget;\n"
" namespace widget {\n"
" class Manager;\n"
" class Windows;\n"
" };\n"
"};\n"
"#include <etk/types.h>\n";
2017-08-22 21:20:43 +02:00
//testRegExSingle("#(\\\\[\\\\\\n]|.)*$", data);
data = " 'dfgd\\'fg' \n"
" vec2 m_offset; \n";
2017-08-22 21:20:43 +02:00
//testRegExSingle("'((\\\\[\\\\'])|.)*'", data);
/*
data = "ddfgdfgh";
2017-08-28 00:02:11 +02:00
etk::RegEx<etk::String> reg(".*");
reg.setMaximize(true);
TK_INFO("Parse RegEx : '" << reg.getRegExDecorated() << "'");
if (reg.parse(data, 0, data.size()) == true) {
//if (reg.processOneElement(data, 0, data.size()) == true) {
TK_INFO(" match [" << reg.start() << ".." << reg.stop() << "] ");
2017-08-28 00:02:11 +02:00
TK_INFO(" ==> '" << etk::String(data, reg.start(), reg.stop()-reg.start()) << "'");
}
data = "plop \"\" sdfsdf s\"swdfsqd sdfgsdfg \" \" sdfsf";
2017-08-28 00:02:11 +02:00
reg = etk::RegEx<etk::String>("\"(\\\\[\\\\\"]|.)*\"");
reg.setMaximize(false);
TK_INFO("Parse RegEx : '" << reg.getRegExDecorated() << "'");
if (reg.parse(data, 0, data.size()) == true) {
//if (reg.processOneElement(data, 0, data.size()) == true) {
TK_INFO(" match [" << reg.start() << ".." << reg.stop() << "] ");
2017-08-28 00:02:11 +02:00
TK_INFO(" ==> '" << etk::String(data, reg.start(), reg.stop()-reg.start()) << "'");
}
//TODO : good : "(\\+|[0-9])*" ==> really bad : "(+|[0-9])*"
data = "void limit(const vec2& _origin, const vec2& _size);\n";
2017-08-28 00:02:11 +02:00
reg = etk::RegEx<etk::String>("\\@(\\w|_)+[ \\t]*\\(");
reg.setMaximize(false);
TK_INFO("Parse RegEx : '" << reg.getRegExDecorated() << "'");
if (reg.parse(data, 0, data.size()) == true) {
//if (reg.processOneElement(data, 0, data.size()) == true) {
TK_INFO(" match [" << reg.start() << ".." << reg.stop() << "] ");
2017-08-28 00:02:11 +02:00
TK_INFO(" ==> '" << etk::String(data, reg.start(), reg.stop()-reg.start()) << "'");
}
data = "void limit const vec2& _origin, const vec2& _size);\n";
if (reg.parse(data, 0, data.size()) == true) {
//if (reg.processOneElement(data, 0, data.size()) == true) {
TK_INFO(" match [" << reg.start() << ".." << reg.stop() << "] ");
2017-08-28 00:02:11 +02:00
TK_INFO(" ==> '" << etk::String(data, reg.start(), reg.stop()-reg.start()) << "'");
}
*/
}