summary | refs | log | tree | commit | diff
path: root/src/modules/urlnormalizer/googleurl/GoogleURLNormalizer.cpp
diff options
context:
space:
mode:
author Andreas Baumann <abaumann@yahoo.com> 2014-07-25 09:28:51 +0200
committer Andreas Baumann <abaumann@yahoo.com> 2014-07-25 09:28:51 +0200
commit e53f13ccaa3a0b595351fc536bf1a6d6be805175 (patch)
tree ecfb7df20e09841283776ca928fbe49f2428a22b /src/modules/urlnormalizer/googleurl/GoogleURLNormalizer.cpp
parent aea482c8b49e9c4fb5e07ee84d80106cdada9f96 (diff)
download crawler-e53f13ccaa3a0b595351fc536bf1a6d6be805175.tar.gz
crawler-e53f13ccaa3a0b595351fc536bf1a6d6be805175.tar.bz2
we also have to normalize with query
Diffstat (limited to 'src/modules/urlnormalizer/googleurl/GoogleURLNormalizer.cpp')
-rwxr-xr-x src/modules/urlnormalizer/googleurl/GoogleURLNormalizer.cpp 3
1 files changed, 2 insertions, 1 deletions
diff --git a/src/modules/urlnormalizer/googleurl/GoogleURLNormalizer.cpp b/src/modules/urlnormalizer/googleurl/GoogleURLNormalizer.cpp
index b09b1f3..c8e50a6 100755
--- a/src/modules/urlnormalizer/googleurl/GoogleURLNormalizer.cpp
+++ b/src/modules/urlnormalizer/googleurl/GoogleURLNormalizer.cpp
@@ -102,7 +102,8 @@ URL GoogleURLNormalizer::normalize( const URL url, const string s )
componentString( canonical, parsed.host ),
port,
componentString( canonical, parsed.path ),
- "", "" );
+ componentString( canonical, parsed.query ),
+ "" );
}
REGISTER_MODULE( "google_urlnormalizer", URLNormalizer, GoogleURLNormalizer )