Move the decode_utf8() call for various feeds to entityize()

author dbs <dbs@dcc99617-32d9-48b4-a31d-7c20da2025e4>

Thu, 14 Jan 2010 04:54:48 +0000 (04:54 +0000)

committer dbs <dbs@dcc99617-32d9-48b4-a31d-7c20da2025e4>

Thu, 14 Jan 2010 04:54:48 +0000 (04:54 +0000)
author dbs <dbs@dcc99617-32d9-48b4-a31d-7c20da2025e4>
Thu, 14 Jan 2010 04:54:48 +0000 (04:54 +0000)
committer dbs <dbs@dcc99617-32d9-48b4-a31d-7c20da2025e4>
Thu, 14 Jan 2010 04:54:48 +0000 (04:54 +0000)
diff --git a/Open-ILS/src/perlmods/OpenILS/Application/AppUtils.pm b/Open-ILS/src/perlmods/OpenILS/Application/AppUtils.pm

index 55546dc..b96521c 100644 (file)
--- a/Open-ILS/src/perlmods/OpenILS/Application/AppUtils.pm
+++ b/Open-ILS/src/perlmods/OpenILS/Application/AppUtils.pm
@@ -14,6 +14,7 @@ use OpenILS::Const qw/:const/;
  use Unicode::Normalize;
  use OpenSRF::Utils::SettingsClient;
  use UUID::Tiny;
+use Encode;
  
  # ---------------------------------------------------------------------------
  # Pile of utilty methods used accross applications.
@@ -1485,6 +1486,10 @@ sub entityize {
      my($self, $string, $form) = @_;
         $form ||= "";
  
+       # If we're going to convert non-ASCII characters to XML entities,
+       # we had better be dealing with a UTF8 string to begin with
+       $string = decode_utf8($string);
+
         if ($form eq 'D') {
                 $string = NFD($string);
         } else {
diff --git a/Open-ILS/src/perlmods/OpenILS/WWW/SuperCat.pm b/Open-ILS/src/perlmods/OpenILS/WWW/SuperCat.pm

index 4418c72..71ced48 100644 (file)
--- a/Open-ILS/src/perlmods/OpenILS/WWW/SuperCat.pm
+++ b/Open-ILS/src/perlmods/OpenILS/WWW/SuperCat.pm
@@ -874,7 +874,7 @@ sub bookbag_feed {
  
  
         print "Content-type: ". $feed->type ."; charset=utf-8\n\n";
-       print $U->entityize(decode_utf8($feed->toString)) . "\n";
+       print $U->entityize($feed->toString) . "\n";
  
         return Apache2::Const::OK;
  }
@@ -951,7 +951,7 @@ sub changes_feed {
  
  
         print "Content-type: ". $feed->type ."; charset=utf-8\n\n";
-       print $U->entityize(decode_utf8($feed->toString)) . "\n";
+       print $U->entityize($feed->toString) . "\n";
  
         return Apache2::Const::OK;
  }
@@ -1676,8 +1676,13 @@ sub sru_search {
         my ($shortname, $holdings) = $url =~ m#/?([^/]*)(/holdings)?#;
  
         if ( $resp->type eq 'searchRetrieve' ) {
-               my $cql_query = decode_utf8($req->query);
-               my $search_string = decode_utf8($req->cql->toEvergreen);
+
+               # These terms are arriving to us double-encoded, so until we
+               # figure out where in the CGI/SRU chain that's happening, we
+               # have to forcefully decode them a second time with
+               # the outer decode('utf8', $string) call
+               my $cql_query = decode('utf8', decode_utf8($req->query));
+               my $search_string = decode('utf8', decode_utf8($req->cql->toEvergreen));
  
                 # Ensure the search string overrides the default site
                 if ($shortname and $search_string !~ m#site:#) {
author	dbs <dbs@dcc99617-32d9-48b4-a31d-7c20da2025e4>
	Thu, 14 Jan 2010 04:54:48 +0000 (04:54 +0000)
committer	dbs <dbs@dcc99617-32d9-48b4-a31d-7c20da2025e4>
	Thu, 14 Jan 2010 04:54:48 +0000 (04:54 +0000)
Open-ILS/src/perlmods/OpenILS/Application/AppUtils.pm		patch \| blob \| history
Open-ILS/src/perlmods/OpenILS/WWW/SuperCat.pm		patch \| blob \| history