/* ***** BEGIN LICENSE BLOCK ***** * Version: MPL 1.1/GPL 2.0/LGPL 2.1 * * The contents of this file are subject to the Mozilla Public License Version * 1.1 (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * http://www.mozilla.org/MPL/ * * Software distributed under the License is distributed on an "AS IS" basis, * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License * for the specific language governing rights and limitations under the * License. * * The Original Code is Url Classifier code * * The Initial Developer of the Original Code is * Google Inc. * Portions created by the Initial Developer are Copyright (C) 2007 * the Initial Developer. All Rights Reserved. * * Contributor(s): * * Alternatively, the contents of this file may be used under the terms of * either the GNU General Public License Version 2 or later (the "GPL"), or * the GNU Lesser General Public License Version 2.1 or later (the "LGPL"), * in which case the provisions of the GPL or the LGPL are applicable instead * of those above. If you wish to allow use of your version of this file only * under the terms of either the GPL or the LGPL, and not to allow others to * use your version of this file under the terms of the MPL, indicate your * decision by deleting the provisions above and replace them with the notice * and other provisions required by the GPL or the LGPL. If you do not delete * the provisions above, a recipient may use your version of this file under * the terms of any one of the MPL, the GPL or the LGPL. * * ***** END LICENSE BLOCK ***** */ #include #include #include "nsEscape.h" #include "nsString.h" #include "nsUrlClassifierUtils.h" #include "nsNetUtil.h" #include "stdlib.h" static int gTotalTests = 0; static int gPassedTests = 0; static char int_to_hex_digit(PRInt32 i) { NS_ASSERTION((i >= 0) && (i <= 15), "int too big in int_to_hex_digit"); return static_cast(((i < 10) ? (i + '0') : ((i - 10) + 'A'))); } static void CheckEquals(nsCString & expected, nsCString & actual) { if (!(expected).Equals((actual))) { fprintf(stderr, "FAILED: expected |%s| but was |%s|\n", (expected).get(), (actual).get()); } else { gPassedTests++; } gTotalTests++; } void TestUnescapeHelper(const char* in, const char* expected) { nsCString out, strIn(in), strExp(expected); nsUrlClassifierUtils utils; NS_UnescapeURL(strIn.get(), strIn.Length(), esc_AlwaysCopy, out); CheckEquals(strExp, out); } // Make sure Unescape from nsEncode.h's unescape does what the server does. void TestUnescape() { // test empty string TestUnescapeHelper("\0", "\0"); // Test docoding of all characters. nsCString allCharsEncoded, allCharsEncodedLowercase, allCharsAsString; for (PRInt32 i = 1; i < 256; ++i) { allCharsEncoded.Append('%'); allCharsEncoded.Append(int_to_hex_digit(i / 16)); allCharsEncoded.Append((int_to_hex_digit(i % 16))); allCharsEncodedLowercase.Append('%'); allCharsEncodedLowercase.Append(tolower(int_to_hex_digit(i / 16))); allCharsEncodedLowercase.Append(tolower(int_to_hex_digit(i % 16))); allCharsAsString.Append(static_cast(i)); } nsUrlClassifierUtils utils; nsCString out; NS_UnescapeURL(allCharsEncoded.get(), allCharsEncoded.Length(), esc_AlwaysCopy, out); CheckEquals(allCharsAsString, out); out.Truncate(); NS_UnescapeURL(allCharsEncodedLowercase.get(), allCharsEncodedLowercase.Length(), esc_AlwaysCopy, out); CheckEquals(allCharsAsString, out); // Test %-related edge cases TestUnescapeHelper("%", "%"); TestUnescapeHelper("%xx", "%xx"); TestUnescapeHelper("%%", "%%"); TestUnescapeHelper("%%%", "%%%"); TestUnescapeHelper("%%%%", "%%%%"); TestUnescapeHelper("%1", "%1"); TestUnescapeHelper("%1z", "%1z"); TestUnescapeHelper("a%1z", "a%1z"); TestUnescapeHelper("abc%d%e%fg%hij%klmno%", "abc%d%e%fg%hij%klmno%"); // A few more tests TestUnescapeHelper("%25", "%"); TestUnescapeHelper("%25%32%35", "%25"); } void TestEncodeHelper(const char* in, const char* expected) { nsCString out, strIn(in), strExp(expected); nsUrlClassifierUtils utils; utils.SpecialEncode(strIn, PR_TRUE, out); CheckEquals(strExp, out); } void TestEnc() { // Test empty string TestEncodeHelper("", ""); // Test that all characters we shouldn't encode ([33-36],[38,126]) are not. nsCString noenc; for (PRInt32 i = 33; i < 127; i++) { if (i != 37) { // skip % noenc.Append(static_cast(i)); } } nsUrlClassifierUtils utils; nsCString out; utils.SpecialEncode(noenc, PR_FALSE, out); CheckEquals(noenc, out); // Test that all the chars that we should encode [0,32],37,[127,255] are nsCString yesAsString, yesExpectedString; for (PRInt32 i = 1; i < 256; i++) { if (i < 33 || i == 37 || i > 126) { yesAsString.Append(static_cast(i)); yesExpectedString.Append('%'); yesExpectedString.Append(int_to_hex_digit(i / 16)); yesExpectedString.Append(int_to_hex_digit(i % 16)); } } out.Truncate(); utils.SpecialEncode(yesAsString, PR_FALSE, out); CheckEquals(yesExpectedString, out); TestEncodeHelper("blah//blah", "blah/blah"); } void TestCanonicalizeHelper(const char* in, const char* expected) { nsCString out, strIn(in), strExp(expected); nsUrlClassifierUtils utils; utils.CanonicalizePath(strIn, out); CheckEquals(strExp, out); } void TestCanonicalize() { // Test repeated %-decoding. Note: %25 --> %, %32 --> 2, %35 --> 5 TestCanonicalizeHelper("%25", "%25"); TestCanonicalizeHelper("%25%32%35", "%25"); TestCanonicalizeHelper("asdf%25%32%35asd", "asdf%25asd"); TestCanonicalizeHelper("%%%25%32%35asd%%", "%25%25%25asd%25%25"); TestCanonicalizeHelper("%25%32%35%25%32%35%25%32%35", "%25%25%25"); TestCanonicalizeHelper("%25", "%25"); TestCanonicalizeHelper("%257Ea%2521b%2540c%2523d%2524e%25f%255E00%252611%252A22%252833%252944_55%252B", "~a!b@c#d$e%25f^00&11*22(33)44_55+"); TestCanonicalizeHelper("", ""); TestCanonicalizeHelper("%31%36%38%2e%31%38%38%2e%39%39%2e%32%36/%2E%73%65%63%75%72%65/%77%77%77%2E%65%62%61%79%2E%63%6F%6D/", "168.188.99.26/.secure/www.ebay.com/"); TestCanonicalizeHelper("195.127.0.11/uploads/%20%20%20%20/.verify/.eBaysecure=updateuserdataxplimnbqmn-xplmvalidateinfoswqpcmlx=hgplmcx/", "195.127.0.11/uploads/%20%20%20%20/.verify/.eBaysecure=updateuserdataxplimnbqmn-xplmvalidateinfoswqpcmlx=hgplmcx/"); } void TestParseIPAddressHelper(const char *in, const char *expected) { nsCString out, strIn(in), strExp(expected); nsUrlClassifierUtils utils; utils.Init(); utils.ParseIPAddress(strIn, out); CheckEquals(strExp, out); } void TestParseIPAddress() { TestParseIPAddressHelper("123.123.0.0.1", ""); TestParseIPAddressHelper("255.0.0.1", "255.0.0.1"); TestParseIPAddressHelper("12.0x12.01234", "12.18.2.156"); TestParseIPAddressHelper("276.2.3", "20.2.0.3"); TestParseIPAddressHelper("012.034.01.055", "10.28.1.45"); TestParseIPAddressHelper("0x12.0x43.0x44.0x01", "18.67.68.1"); TestParseIPAddressHelper("167838211", "10.1.2.3"); TestParseIPAddressHelper("3279880203", "195.127.0.11"); TestParseIPAddressHelper("0x12434401", "18.67.68.1"); TestParseIPAddressHelper("413960661", "24.172.137.213"); TestParseIPAddressHelper("03053104725", "24.172.137.213"); TestParseIPAddressHelper("030.0254.0x89d5", "24.172.137.213"); TestParseIPAddressHelper("1.234.4.0377", "1.234.4.255"); TestParseIPAddressHelper("1.2.3.00x0", ""); TestParseIPAddressHelper("10.192.95.89 xy", "10.192.95.89"); TestParseIPAddressHelper("10.192.95.89 xyz", ""); TestParseIPAddressHelper("1.2.3.0x0", "1.2.3.0"); TestParseIPAddressHelper("1.2.3.4", "1.2.3.4"); } void TestCanonicalNumHelper(const char *in, PRUint32 bytes, bool allowOctal, const char *expected) { nsCString out, strIn(in), strExp(expected); nsUrlClassifierUtils utils; utils.Init(); utils.CanonicalNum(strIn, bytes, allowOctal, out); CheckEquals(strExp, out); } void TestCanonicalNum() { TestCanonicalNumHelper("", 1, true, ""); TestCanonicalNumHelper("10", 0, true, ""); TestCanonicalNumHelper("45", 1, true, "45"); TestCanonicalNumHelper("0x10", 1, true, "16"); TestCanonicalNumHelper("367", 2, true, "1.111"); TestCanonicalNumHelper("012345", 3, true, "0.20.229"); TestCanonicalNumHelper("0173", 1, true, "123"); TestCanonicalNumHelper("09", 1, false, "9"); TestCanonicalNumHelper("0x120x34", 2, true, ""); TestCanonicalNumHelper("0x12fc", 2, true, "18.252"); TestCanonicalNumHelper("3279880203", 4, true, "195.127.0.11"); TestCanonicalNumHelper("0x0000059", 1, true, "89"); TestCanonicalNumHelper("0x00000059", 1, true, "89"); TestCanonicalNumHelper("0x0000067", 1, true, "103"); } void TestHostnameHelper(const char *in, const char *expected) { nsCString out, strIn(in), strExp(expected); nsUrlClassifierUtils utils; utils.Init(); utils.CanonicalizeHostname(strIn, out); CheckEquals(strExp, out); } void TestHostname() { TestHostnameHelper("abcd123;[]", "abcd123;[]"); TestHostnameHelper("abc.123", "abc.123"); TestHostnameHelper("abc..123", "abc.123"); TestHostnameHelper("trailing.", "trailing"); TestHostnameHelper("i love trailing dots....", "i%20love%20trailing%20dots"); TestHostnameHelper(".leading", "leading"); TestHostnameHelper("..leading", "leading"); TestHostnameHelper(".dots.", "dots"); TestHostnameHelper(".both.", "both"); TestHostnameHelper(".both..", "both"); TestHostnameHelper("..both.", "both"); TestHostnameHelper("..both..", "both"); TestHostnameHelper("..a.b.c.d..", "a.b.c.d"); TestHostnameHelper("..127.0.0.1..", "127.0.0.1"); TestHostnameHelper("asdf!@#$a", "asdf!@#$a"); TestHostnameHelper("AB CD 12354", "ab%20cd%2012354"); TestHostnameHelper("\1\2\3\4\112\177", "%01%02%03%04j%7F"); TestHostnameHelper("<>.AS/-+", "<>.as/-+"); } void TestLongHostname() { static const int kTestSize = 1024 * 150; char *str = static_cast(malloc(kTestSize + 1)); memset(str, 'x', kTestSize); str[kTestSize] = '\0'; nsUrlClassifierUtils utils; utils.Init(); nsCAutoString out; nsDependentCString in(str); PRIntervalTime clockStart = PR_IntervalNow(); utils.CanonicalizeHostname(in, out); PRIntervalTime clockEnd = PR_IntervalNow(); CheckEquals(in, out); printf("CanonicalizeHostname on long string (%dms)\n", PR_IntervalToMilliseconds(clockEnd - clockStart)); } int main(int argc, char **argv) { NS_LogInit(); TestUnescape(); TestEnc(); TestCanonicalize(); TestCanonicalNum(); TestParseIPAddress(); TestHostname(); TestLongHostname(); printf("%d of %d tests passed\n", gPassedTests, gTotalTests); // Non-zero return status signals test failure to build system. return (gPassedTests != gTotalTests); }