webkit/glue/regular_expression_unittest.cc - platform/external/chromium - Git at Google

 // Copyright (c) 2006-2008 The Chromium Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "testing/gtest/include/gtest/gtest.h"
 #include "third_party/WebKit/Source/WebKit/chromium/public/WebRegularExpression.h"
 #include "third_party/WebKit/Source/WebKit/chromium/public/WebString.h"
 #include "third_party/WebKit/Source/WebKit/chromium/public/WebTextCaseSensitivity.h"

 using namespace WebKit;

 namespace {

 class RegexTest : public testing::Test {
 };

 struct Match {
   const WebUChar* text;
   const int textLength;
   const int matchPosition;
   const int matchLength;
 };

 void testMatches(const WebRegularExpression& regex,
                  const Match* matches,
                  const size_t nMatches) {

   for (size_t i = 0; i < nMatches; ++i) {
     int matchedLength = matches[i].textLength;
     EXPECT_EQ(matches[i].matchPosition, regex.match(
         WebString(matches[i].text, matches[i].textLength), 0, &matchedLength));
     if (matches[i].matchPosition != -1)
       EXPECT_EQ(matches[i].matchLength, matchedLength);
   }

 }

 }  // namespace

 #define MATCH_DESC(webuchar, matchPosition, matchLength) \
     { webuchar, arraysize(webuchar), matchPosition, matchLength }


 TEST(RegexTest, Basic) {
   // Just make sure we're not completely broken.
   WebRegularExpression regex("the quick brown fox", WebTextCaseSensitive);
   EXPECT_EQ(0, regex.match("the quick brown fox"));
   EXPECT_EQ(1, regex.match(" the quick brown fox"));
   EXPECT_EQ(3, regex.match("foothe quick brown foxbar"));

   EXPECT_EQ(-1, regex.match("The quick brown FOX"));
   EXPECT_EQ(-1, regex.match("the quick brown fo"));
 }

 TEST(RegexTest, Unicode) {
   // Make sure we get the right offsets for unicode strings.
   WebUChar pattern[] = {L'\x6240', L'\x6709', L'\x7f51', L'\x9875'};
   WebRegularExpression regex(WebString(pattern, arraysize(pattern)),
                              WebTextCaseInsensitive);

   WebUChar text1[] = {L'\x6240', L'\x6709', L'\x7f51', L'\x9875'};
   WebUChar text2[] = {L' ', L'\x6240', L'\x6709', L'\x7f51', L'\x9875'};
   WebUChar text3[] = {L'f', L'o', L'o', L'\x6240', L'\x6709', L'\x7f51', L'\x9875', L'b', L'a', L'r'};
   WebUChar text4[] = {L'\x4e2d', L'\x6587', L'\x7f51',  L'\x9875', L'\x6240', L'\x6709', L'\x7f51', L'\x9875'};

   const Match matches[] = {
     MATCH_DESC(text1, 0, 4),
     MATCH_DESC(text2, 1, 4),
     MATCH_DESC(text3, 3, 4),
     MATCH_DESC(text4, 4, 4),
   };

   testMatches(regex, matches, arraysize(matches));
 }

 TEST(RegexTest, UnicodeMixedLength) {
   WebUChar pattern[] = {L':', L'[', L' ', L'\x2000', L']', L'+', L':'};
   WebRegularExpression regex(WebString(pattern, arraysize(pattern)),
                              WebTextCaseInsensitive);

   WebUChar text1[] = {L':', L' ', L' ', L':'};
   WebUChar text2[] = {L' ', L' ', L':', L' ', L' ', L' ', L' ', L':', L' ', L' '};
   WebUChar text3[] = {L' ', L':', L' ', L'\x2000', L' ', L':', L' '};
   WebUChar text4[] = {L'\x6240', L'\x6709', L'\x7f51', L'\x9875', L' ', L':', L' ', L'\x2000', L' ', L'\x2000', L' ', L':', L' '};
   WebUChar text5[] = {L' '};
   WebUChar text6[] = {L':', L':'};

   const Match matches[] = {
     MATCH_DESC(text1, 0, 4),
     MATCH_DESC(text2, 2, 6),
     MATCH_DESC(text3, 1, 5),
     MATCH_DESC(text4, 5, 7),
     MATCH_DESC(text5, -1, -1),
     MATCH_DESC(text6, -1, -1),
   };

   testMatches(regex, matches, arraysize(matches));
 }

 TEST(RegexTest, EmptyMatch) {
   WebRegularExpression regex("|x", WebTextCaseInsensitive);
   int matchedLength = 0;
   EXPECT_EQ(0, regex.match("", 0, &matchedLength));
   EXPECT_EQ(0, matchedLength);
 }
	// Copyright (c) 2006-2008 The Chromium Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	#include "testing/gtest/include/gtest/gtest.h"
	#include "third_party/WebKit/Source/WebKit/chromium/public/WebRegularExpression.h"
	#include "third_party/WebKit/Source/WebKit/chromium/public/WebString.h"
	#include "third_party/WebKit/Source/WebKit/chromium/public/WebTextCaseSensitivity.h"

	using namespace WebKit;

	namespace {

	class RegexTest : public testing::Test {
	};

	struct Match {
	const WebUChar* text;
	const int textLength;
	const int matchPosition;
	const int matchLength;
	};

	void testMatches(const WebRegularExpression& regex,
	const Match* matches,
	const size_t nMatches) {

	for (size_t i = 0; i < nMatches; ++i) {
	int matchedLength = matches[i].textLength;
	EXPECT_EQ(matches[i].matchPosition, regex.match(
	WebString(matches[i].text, matches[i].textLength), 0, &matchedLength));
	if (matches[i].matchPosition != -1)
	EXPECT_EQ(matches[i].matchLength, matchedLength);
	}

	}

	} // namespace

	#define MATCH_DESC(webuchar, matchPosition, matchLength) \
	{ webuchar, arraysize(webuchar), matchPosition, matchLength }


	TEST(RegexTest, Basic) {
	// Just make sure we're not completely broken.
	WebRegularExpression regex("the quick brown fox", WebTextCaseSensitive);
	EXPECT_EQ(0, regex.match("the quick brown fox"));
	EXPECT_EQ(1, regex.match(" the quick brown fox"));
	EXPECT_EQ(3, regex.match("foothe quick brown foxbar"));

	EXPECT_EQ(-1, regex.match("The quick brown FOX"));
	EXPECT_EQ(-1, regex.match("the quick brown fo"));
	}

	TEST(RegexTest, Unicode) {
	// Make sure we get the right offsets for unicode strings.
	WebUChar pattern[] = {L'\x6240', L'\x6709', L'\x7f51', L'\x9875'};
	WebRegularExpression regex(WebString(pattern, arraysize(pattern)),
	WebTextCaseInsensitive);

	WebUChar text1[] = {L'\x6240', L'\x6709', L'\x7f51', L'\x9875'};
	WebUChar text2[] = {L' ', L'\x6240', L'\x6709', L'\x7f51', L'\x9875'};
	WebUChar text3[] = {L'f', L'o', L'o', L'\x6240', L'\x6709', L'\x7f51', L'\x9875', L'b', L'a', L'r'};
	WebUChar text4[] = {L'\x4e2d', L'\x6587', L'\x7f51', L'\x9875', L'\x6240', L'\x6709', L'\x7f51', L'\x9875'};

	const Match matches[] = {
	MATCH_DESC(text1, 0, 4),
	MATCH_DESC(text2, 1, 4),
	MATCH_DESC(text3, 3, 4),
	MATCH_DESC(text4, 4, 4),
	};

	testMatches(regex, matches, arraysize(matches));
	}

	TEST(RegexTest, UnicodeMixedLength) {
	WebUChar pattern[] = {L':', L'[', L' ', L'\x2000', L']', L'+', L':'};
	WebRegularExpression regex(WebString(pattern, arraysize(pattern)),
	WebTextCaseInsensitive);

	WebUChar text1[] = {L':', L' ', L' ', L':'};
	WebUChar text2[] = {L' ', L' ', L':', L' ', L' ', L' ', L' ', L':', L' ', L' '};
	WebUChar text3[] = {L' ', L':', L' ', L'\x2000', L' ', L':', L' '};
	WebUChar text4[] = {L'\x6240', L'\x6709', L'\x7f51', L'\x9875', L' ', L':', L' ', L'\x2000', L' ', L'\x2000', L' ', L':', L' '};
	WebUChar text5[] = {L' '};
	WebUChar text6[] = {L':', L':'};

	const Match matches[] = {
	MATCH_DESC(text1, 0, 4),
	MATCH_DESC(text2, 2, 6),
	MATCH_DESC(text3, 1, 5),
	MATCH_DESC(text4, 5, 7),
	MATCH_DESC(text5, -1, -1),
	MATCH_DESC(text6, -1, -1),
	};

	testMatches(regex, matches, arraysize(matches));
	}

	TEST(RegexTest, EmptyMatch) {
	WebRegularExpression regex("\|x", WebTextCaseInsensitive);
	int matchedLength = 0;
	EXPECT_EQ(0, regex.match("", 0, &matchedLength));
	EXPECT_EQ(0, matchedLength);
	}