forked from mirrors/gecko-dev
		
	
		
			
				
	
	
		
			358 lines
		
	
	
	
		
			12 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			358 lines
		
	
	
	
		
			12 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
/* ***** BEGIN LICENSE BLOCK *****
 * Version: MPL 1.1/GPL 2.0/LGPL 2.1
 *
 * The contents of this file are subject to the Mozilla Public License Version
 * 1.1 (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 * http://www.mozilla.org/MPL/
 *
 * Software distributed under the License is distributed on an "AS IS" basis,
 * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
 * for the specific language governing rights and limitations under the
 * License.
 *
 * The Original Code is Url Classifier code
 *
 * The Initial Developer of the Original Code is
 * Google Inc.
 * Portions created by the Initial Developer are Copyright (C) 2007
 * the Initial Developer. All Rights Reserved.
 *
 * Contributor(s):
 *
 * Alternatively, the contents of this file may be used under the terms of
 * either the GNU General Public License Version 2 or later (the "GPL"), or
 * the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
 * in which case the provisions of the GPL or the LGPL are applicable instead
 * of those above. If you wish to allow use of your version of this file only
 * under the terms of either the GPL or the LGPL, and not to allow others to
 * use your version of this file under the terms of the MPL, indicate your
 * decision by deleting the provisions above and replace them with the notice
 * and other provisions required by the GPL or the LGPL. If you do not delete
 * the provisions above, a recipient may use your version of this file under
 * the terms of any one of the MPL, the GPL or the LGPL.
 *
 * ***** END LICENSE BLOCK ***** */
 | 
						|
 | 
						|
#include <stdio.h>
 | 
						|
#include <ctype.h>
 | 
						|
#include "nsEscape.h"
 | 
						|
#include "nsString.h"
 | 
						|
#include "nsUrlClassifierUtils.h"
 | 
						|
#include "nsNetUtil.h"
 | 
						|
#include "stdlib.h"
 | 
						|
#include "TestHarness.h"
 | 
						|
 | 
						|
// Number of individual checks executed so far. Incremented once per check by
// CheckEquals() and TestFragmentSet(); compared against gPassedTests in main().
static int gTotalTests = 0;
 | 
						|
// Number of checks that succeeded. main() reports success only when this
// equals gTotalTests.
static int gPassedTests = 0;
 | 
						|
 | 
						|
// Converts a nibble value to its uppercase hexadecimal digit: 0-9 map to
// '0'-'9' and 10-15 map to 'A'-'F'. The value is checked with NS_ASSERTION to
// lie in [0, 15].
static char int_to_hex_digit(PRInt32 i) {
  NS_ASSERTION((i >= 0) && (i <= 15), "int too big in int_to_hex_digit");
  if (i < 10) {
    // Decimal digit range.
    return static_cast<char>(i + '0');
  }
  // Letter range: 10 -> 'A', 11 -> 'B', ...
  return static_cast<char>((i - 10) + 'A');
}
 | 
						|
 | 
						|
static void CheckEquals(nsCString & expected, nsCString & actual)
 | 
						|
{
 | 
						|
  if (!(expected).Equals((actual))) {
 | 
						|
    fail("expected |%s| but got |%s|", (expected).get(), (actual).get());
 | 
						|
  } else {
 | 
						|
    gPassedTests++;
 | 
						|
  }
 | 
						|
  gTotalTests++;
 | 
						|
}
 | 
						|
 | 
						|
void TestUnescapeHelper(const char* in, const char* expected)
 | 
						|
{
 | 
						|
  nsCString out, strIn(in), strExp(expected);
 | 
						|
  nsUrlClassifierUtils utils;
 | 
						|
  
 | 
						|
  NS_UnescapeURL(strIn.get(), strIn.Length(), esc_AlwaysCopy, out);
 | 
						|
  CheckEquals(strExp, out);
 | 
						|
}
 | 
						|
 | 
						|
// Make sure Unescape from nsEncode.h's unescape does what the server does.
 | 
						|
void TestUnescape()
 | 
						|
{
 | 
						|
  // test empty string
 | 
						|
  TestUnescapeHelper("\0", "\0");
 | 
						|
 | 
						|
  // Test docoding of all characters.
 | 
						|
  nsCString allCharsEncoded, allCharsEncodedLowercase, allCharsAsString;
 | 
						|
  for (PRInt32 i = 1; i < 256; ++i) {
 | 
						|
    allCharsEncoded.Append('%');
 | 
						|
    allCharsEncoded.Append(int_to_hex_digit(i / 16));
 | 
						|
    allCharsEncoded.Append((int_to_hex_digit(i % 16)));
 | 
						|
    
 | 
						|
    allCharsEncodedLowercase.Append('%');
 | 
						|
    allCharsEncodedLowercase.Append(tolower(int_to_hex_digit(i / 16)));
 | 
						|
    allCharsEncodedLowercase.Append(tolower(int_to_hex_digit(i % 16)));
 | 
						|
    
 | 
						|
    allCharsAsString.Append(static_cast<char>(i));
 | 
						|
  }
 | 
						|
  
 | 
						|
  nsUrlClassifierUtils utils;
 | 
						|
  nsCString out;
 | 
						|
  NS_UnescapeURL(allCharsEncoded.get(), allCharsEncoded.Length(), esc_AlwaysCopy, out);
 | 
						|
  CheckEquals(allCharsAsString, out);
 | 
						|
  
 | 
						|
  out.Truncate();
 | 
						|
  NS_UnescapeURL(allCharsEncodedLowercase.get(), allCharsEncodedLowercase.Length(), esc_AlwaysCopy, out);
 | 
						|
  CheckEquals(allCharsAsString, out);
 | 
						|
 | 
						|
  // Test %-related edge cases
 | 
						|
  TestUnescapeHelper("%", "%");
 | 
						|
  TestUnescapeHelper("%xx", "%xx");
 | 
						|
  TestUnescapeHelper("%%", "%%");
 | 
						|
  TestUnescapeHelper("%%%", "%%%");
 | 
						|
  TestUnescapeHelper("%%%%", "%%%%");
 | 
						|
  TestUnescapeHelper("%1", "%1");
 | 
						|
  TestUnescapeHelper("%1z", "%1z");
 | 
						|
  TestUnescapeHelper("a%1z", "a%1z");
 | 
						|
  TestUnescapeHelper("abc%d%e%fg%hij%klmno%", "abc%d%e%fg%hij%klmno%");
 | 
						|
 | 
						|
  // A few more tests
 | 
						|
  TestUnescapeHelper("%25", "%");
 | 
						|
  TestUnescapeHelper("%25%32%35", "%25");
 | 
						|
}
 | 
						|
 | 
						|
void TestEncodeHelper(const char* in, const char* expected)
 | 
						|
{
 | 
						|
  nsCString out, strIn(in), strExp(expected);
 | 
						|
  nsUrlClassifierUtils utils;
 | 
						|
 | 
						|
  utils.SpecialEncode(strIn, PR_TRUE, out);
 | 
						|
  CheckEquals(strExp, out);
 | 
						|
}
 | 
						|
 | 
						|
void TestEnc()
 | 
						|
{
 | 
						|
  // Test empty string
 | 
						|
  TestEncodeHelper("", "");
 | 
						|
 | 
						|
  // Test that all characters we shouldn't encode ([33-36],[38,126]) are not.
 | 
						|
  nsCString noenc;
 | 
						|
  for (PRInt32 i = 33; i < 127; i++) {
 | 
						|
    if (i != 37) {                      // skip %
 | 
						|
      noenc.Append(static_cast<char>(i));
 | 
						|
    }
 | 
						|
  }
 | 
						|
  nsUrlClassifierUtils utils;
 | 
						|
  nsCString out;
 | 
						|
  utils.SpecialEncode(noenc, PR_FALSE, out);
 | 
						|
  CheckEquals(noenc, out);
 | 
						|
 | 
						|
  // Test that all the chars that we should encode [0,32],37,[127,255] are
 | 
						|
  nsCString yesAsString, yesExpectedString;
 | 
						|
  for (PRInt32 i = 1; i < 256; i++) {
 | 
						|
    if (i < 33 || i == 37 || i > 126) {
 | 
						|
      yesAsString.Append(static_cast<char>(i));
 | 
						|
      yesExpectedString.Append('%');
 | 
						|
      yesExpectedString.Append(int_to_hex_digit(i / 16));
 | 
						|
      yesExpectedString.Append(int_to_hex_digit(i % 16));
 | 
						|
    }
 | 
						|
  }
 | 
						|
  
 | 
						|
  out.Truncate();
 | 
						|
  utils.SpecialEncode(yesAsString, PR_FALSE, out);
 | 
						|
  CheckEquals(yesExpectedString, out);
 | 
						|
 | 
						|
  TestEncodeHelper("blah//blah", "blah/blah");
 | 
						|
}
 | 
						|
 | 
						|
void TestCanonicalizeHelper(const char* in, const char* expected)
 | 
						|
{
 | 
						|
  nsCString out, strIn(in), strExp(expected);
 | 
						|
  nsUrlClassifierUtils utils;
 | 
						|
 | 
						|
  utils.CanonicalizePath(strIn, out);
 | 
						|
  CheckEquals(strExp, out);
 | 
						|
}
 | 
						|
 | 
						|
void TestCanonicalize()
 | 
						|
{
 | 
						|
  // Test repeated %-decoding. Note: %25 --> %, %32 --> 2, %35 --> 5
 | 
						|
  TestCanonicalizeHelper("%25", "%25");
 | 
						|
  TestCanonicalizeHelper("%25%32%35", "%25");
 | 
						|
  TestCanonicalizeHelper("asdf%25%32%35asd", "asdf%25asd");
 | 
						|
  TestCanonicalizeHelper("%%%25%32%35asd%%", "%25%25%25asd%25%25");
 | 
						|
  TestCanonicalizeHelper("%25%32%35%25%32%35%25%32%35", "%25%25%25");
 | 
						|
  TestCanonicalizeHelper("%25", "%25");
 | 
						|
  TestCanonicalizeHelper("%257Ea%2521b%2540c%2523d%2524e%25f%255E00%252611%252A22%252833%252944_55%252B",
 | 
						|
      "~a!b@c#d$e%25f^00&11*22(33)44_55+");
 | 
						|
 | 
						|
  TestCanonicalizeHelper("", "");
 | 
						|
  TestCanonicalizeHelper("%31%36%38%2e%31%38%38%2e%39%39%2e%32%36/%2E%73%65%63%75%72%65/%77%77%77%2E%65%62%61%79%2E%63%6F%6D/",
 | 
						|
                         "168.188.99.26/.secure/www.ebay.com/");
 | 
						|
  TestCanonicalizeHelper("195.127.0.11/uploads/%20%20%20%20/.verify/.eBaysecure=updateuserdataxplimnbqmn-xplmvalidateinfoswqpcmlx=hgplmcx/",
 | 
						|
                         "195.127.0.11/uploads/%20%20%20%20/.verify/.eBaysecure=updateuserdataxplimnbqmn-xplmvalidateinfoswqpcmlx=hgplmcx/");
 | 
						|
  // Added in bug 489455.  %00 should no longer be changed to %01.
 | 
						|
  TestCanonicalizeHelper("%00", "%00");
 | 
						|
}
 | 
						|
 | 
						|
void TestParseIPAddressHelper(const char *in, const char *expected)
 | 
						|
{
 | 
						|
  nsCString out, strIn(in), strExp(expected);
 | 
						|
  nsUrlClassifierUtils utils;
 | 
						|
  utils.Init();
 | 
						|
 | 
						|
  utils.ParseIPAddress(strIn, out);
 | 
						|
  CheckEquals(strExp, out);
 | 
						|
}
 | 
						|
 | 
						|
void TestParseIPAddress()
 | 
						|
{
 | 
						|
  TestParseIPAddressHelper("123.123.0.0.1", "");
 | 
						|
  TestParseIPAddressHelper("255.0.0.1", "255.0.0.1");
 | 
						|
  TestParseIPAddressHelper("12.0x12.01234", "12.18.2.156");
 | 
						|
  TestParseIPAddressHelper("276.2.3", "20.2.0.3");
 | 
						|
  TestParseIPAddressHelper("012.034.01.055", "10.28.1.45");
 | 
						|
  TestParseIPAddressHelper("0x12.0x43.0x44.0x01", "18.67.68.1");
 | 
						|
  TestParseIPAddressHelper("167838211", "10.1.2.3");
 | 
						|
  TestParseIPAddressHelper("3279880203", "195.127.0.11");
 | 
						|
  TestParseIPAddressHelper("0x12434401", "18.67.68.1");
 | 
						|
  TestParseIPAddressHelper("413960661", "24.172.137.213");
 | 
						|
  TestParseIPAddressHelper("03053104725", "24.172.137.213");
 | 
						|
  TestParseIPAddressHelper("030.0254.0x89d5", "24.172.137.213");
 | 
						|
  TestParseIPAddressHelper("1.234.4.0377", "1.234.4.255");
 | 
						|
  TestParseIPAddressHelper("1.2.3.00x0", "");
 | 
						|
  TestParseIPAddressHelper("10.192.95.89 xy", "10.192.95.89");
 | 
						|
  TestParseIPAddressHelper("10.192.95.89 xyz", "");
 | 
						|
  TestParseIPAddressHelper("1.2.3.0x0", "1.2.3.0");
 | 
						|
  TestParseIPAddressHelper("1.2.3.4", "1.2.3.4");
 | 
						|
}
 | 
						|
 | 
						|
void TestCanonicalNumHelper(const char *in, PRUint32 bytes,
 | 
						|
                            bool allowOctal, const char *expected)
 | 
						|
{
 | 
						|
  nsCString out, strIn(in), strExp(expected);
 | 
						|
  nsUrlClassifierUtils utils;
 | 
						|
  utils.Init();
 | 
						|
 | 
						|
  utils.CanonicalNum(strIn, bytes, allowOctal, out);
 | 
						|
  CheckEquals(strExp, out);
 | 
						|
}
 | 
						|
 | 
						|
void TestCanonicalNum()
 | 
						|
{
 | 
						|
  TestCanonicalNumHelper("", 1, true, "");
 | 
						|
  TestCanonicalNumHelper("10", 0, true, "");
 | 
						|
  TestCanonicalNumHelper("45", 1, true, "45");
 | 
						|
  TestCanonicalNumHelper("0x10", 1, true, "16");
 | 
						|
  TestCanonicalNumHelper("367", 2, true, "1.111");
 | 
						|
  TestCanonicalNumHelper("012345", 3, true, "0.20.229");
 | 
						|
  TestCanonicalNumHelper("0173", 1, true, "123");
 | 
						|
  TestCanonicalNumHelper("09", 1, false, "9");
 | 
						|
  TestCanonicalNumHelper("0x120x34", 2, true, "");
 | 
						|
  TestCanonicalNumHelper("0x12fc", 2, true, "18.252");
 | 
						|
  TestCanonicalNumHelper("3279880203", 4, true, "195.127.0.11");
 | 
						|
  TestCanonicalNumHelper("0x0000059", 1, true, "89");
 | 
						|
  TestCanonicalNumHelper("0x00000059", 1, true, "89");
 | 
						|
  TestCanonicalNumHelper("0x0000067", 1, true, "103");
 | 
						|
}
 | 
						|
 | 
						|
void TestHostnameHelper(const char *in, const char *expected)
 | 
						|
{
 | 
						|
  nsCString out, strIn(in), strExp(expected);
 | 
						|
  nsUrlClassifierUtils utils;
 | 
						|
  utils.Init();
 | 
						|
 | 
						|
  utils.CanonicalizeHostname(strIn, out);
 | 
						|
  CheckEquals(strExp, out);
 | 
						|
}
 | 
						|
 | 
						|
void TestHostname()
 | 
						|
{
 | 
						|
  TestHostnameHelper("abcd123;[]", "abcd123;[]");
 | 
						|
  TestHostnameHelper("abc.123", "abc.123");
 | 
						|
  TestHostnameHelper("abc..123", "abc.123");
 | 
						|
  TestHostnameHelper("trailing.", "trailing");
 | 
						|
  TestHostnameHelper("i love trailing dots....", "i%20love%20trailing%20dots");
 | 
						|
  TestHostnameHelper(".leading", "leading");
 | 
						|
  TestHostnameHelper("..leading", "leading");
 | 
						|
  TestHostnameHelper(".dots.", "dots");
 | 
						|
  TestHostnameHelper(".both.", "both");
 | 
						|
  TestHostnameHelper(".both..", "both");
 | 
						|
  TestHostnameHelper("..both.", "both");
 | 
						|
  TestHostnameHelper("..both..", "both");
 | 
						|
  TestHostnameHelper("..a.b.c.d..", "a.b.c.d");
 | 
						|
  TestHostnameHelper("..127.0.0.1..", "127.0.0.1");
 | 
						|
  TestHostnameHelper("asdf!@#$a", "asdf!@#$a");
 | 
						|
  TestHostnameHelper("AB CD 12354", "ab%20cd%2012354");
 | 
						|
  TestHostnameHelper("\1\2\3\4\112\177", "%01%02%03%04j%7F");
 | 
						|
  TestHostnameHelper("<>.AS/-+", "<>.as/-+");
 | 
						|
  // Added in bug 489455.  %00 should no longer be changed to %01.
 | 
						|
  TestHostnameHelper("%00", "%00");
 | 
						|
}
 | 
						|
 | 
						|
void TestLongHostname()
 | 
						|
{
 | 
						|
  static const int kTestSize = 1024 * 150;
 | 
						|
  char *str = static_cast<char*>(malloc(kTestSize + 1));
 | 
						|
  memset(str, 'x', kTestSize);
 | 
						|
  str[kTestSize] = '\0';
 | 
						|
 | 
						|
  nsUrlClassifierUtils utils;
 | 
						|
  utils.Init();
 | 
						|
 | 
						|
  nsCAutoString out;
 | 
						|
  nsDependentCString in(str);
 | 
						|
  PRIntervalTime clockStart = PR_IntervalNow();
 | 
						|
  utils.CanonicalizeHostname(in, out);
 | 
						|
  PRIntervalTime clockEnd = PR_IntervalNow();
 | 
						|
 | 
						|
  CheckEquals(in, out);
 | 
						|
 | 
						|
  printf("CanonicalizeHostname on long string (%dms)\n",
 | 
						|
         PR_IntervalToMilliseconds(clockEnd - clockStart));
 | 
						|
}
 | 
						|
 | 
						|
void TestFragmentSet()
 | 
						|
{
 | 
						|
  nsUrlClassifierFragmentSet set;
 | 
						|
  set.Init(3);
 | 
						|
 | 
						|
  set.Put(NS_LITERAL_CSTRING("a"));
 | 
						|
  set.Put(NS_LITERAL_CSTRING("b"));
 | 
						|
  set.Put(NS_LITERAL_CSTRING("c"));
 | 
						|
 | 
						|
  // At this point, adding a fourth element would push "a" off.
 | 
						|
  // Make sure that set.Has("a") moves it to the front of the list
 | 
						|
  set.Has(NS_LITERAL_CSTRING("a"));
 | 
						|
 | 
						|
  // Now add a new item.  This should now push "b" off the list,
 | 
						|
  // but leave "a"
 | 
						|
  set.Put(NS_LITERAL_CSTRING("d"));
 | 
						|
 | 
						|
  gTotalTests++;
 | 
						|
  if (set.Has(NS_LITERAL_CSTRING("a")))
 | 
						|
    gPassedTests++;
 | 
						|
  else
 | 
						|
    fail("set.Has(\"a\") failed.");
 | 
						|
 | 
						|
  gTotalTests++;
 | 
						|
  if (!set.Has(NS_LITERAL_CSTRING("b")))
 | 
						|
    gPassedTests++;
 | 
						|
  else
 | 
						|
    fail("!set.Has(\"b\") failed.");
 | 
						|
}
 | 
						|
 | 
						|
int main(int argc, char **argv)
 | 
						|
{
 | 
						|
  ScopedXPCOM xpcom("URLClassiferUtils");
 | 
						|
 | 
						|
  TestUnescape();
 | 
						|
  TestEnc();
 | 
						|
  TestCanonicalize();
 | 
						|
  TestCanonicalNum();
 | 
						|
  TestParseIPAddress();
 | 
						|
  TestHostname();
 | 
						|
  TestLongHostname();
 | 
						|
  TestFragmentSet();
 | 
						|
 | 
						|
  if (gPassedTests == gTotalTests)
 | 
						|
    passed(__FILE__);
 | 
						|
  printf("%d of %d tests passed\n", gPassedTests, gTotalTests);
 | 
						|
  // Non-zero return status signals test failure to build system.
 | 
						|
 | 
						|
  return (gPassedTests != gTotalTests);
 | 
						|
}
 |