Normalize records imported from Z39.50 servers.

author Frédérick Capovilla <frederick.capovilla@libeo.com>

Wed, 28 Sep 2011 17:58:14 +0000 (13:58 -0400)

committer Paul Poulain <paul.poulain@biblibre.com>

Mon, 8 Oct 2012 16:46:56 +0000 (18:46 +0200)
author Frédérick Capovilla <frederick.capovilla@libeo.com>
Wed, 28 Sep 2011 17:58:14 +0000 (13:58 -0400)
committer Paul Poulain <paul.poulain@biblibre.com>
Mon, 8 Oct 2012 16:46:56 +0000 (18:46 +0200)
diff --git a/C4/Breeding.pm b/C4/Breeding.pm

index ea3e902..9dedc4d 100644 (file)
--- a/C4/Breeding.pm
+++ b/C4/Breeding.pm
@@ -94,6 +94,9 @@ sub ImportBreeding {
          ($marcrecord, $charset_result, $charset_errors) = 
              MarcToUTF8Record($marcarray[$i]."\x1D", C4::Context->preference("marcflavour"), $encoding);
          
+        # Normalize the record so it doesn't have separated diacritics
+        SetUTF8Flag($marcrecord);
+
  #         warn "$i : $marcarray[$i]";
          # FIXME - currently this does nothing 
          my @warnings = $marcrecord->warnings();
diff --git a/C4/ImportBatch.pm b/C4/ImportBatch.pm

index 648d96e..15f1acb 100644 (file)
--- a/C4/ImportBatch.pm
+++ b/C4/ImportBatch.pm
@@ -382,6 +382,10 @@ sub  BatchStageMarcRecords {
          if (scalar($marc_record->fields()) == 0) {
              push @invalid_records, $marc_blob;
          } else {
+
+            # Normalize the record so it doesn't have separated diacritics
+            SetUTF8Flag($marc_record);
+
              $num_valid++;
              if ($record_type eq 'biblio') {
                  $import_record_id = AddBiblioToBatch($batch_id, $rec_num, $marc_record, $encoding, int(rand(99999)), 0);
diff --git a/acqui/z3950_search.pl b/acqui/z3950_search.pl

index a1cdce4..8da89b6 100755 (executable)
--- a/acqui/z3950_search.pl
+++ b/acqui/z3950_search.pl
@@ -281,6 +281,10 @@ warn "query ".$query  if $DEBUG;
  ## In HEAD i change everything to UTF-8
  # In rel2_2 i am not sure what encoding is so no character conversion is done here
  ##Add necessary encoding changes to here -TG
+
+                        # Normalize the record so it doesn't have separated diacritics
+                        SetUTF8Flag($marcrecord);
+
                          my $oldbiblio = TransformMarcToKoha( $dbh, $marcrecord, "" );
                          $oldbiblio->{isbn}   =~ s/ |-|\.//g if $oldbiblio->{isbn};
                          # pad | and ( with spaces to allow line breaks in the HTML
diff --git a/cataloguing/z3950_search.pl b/cataloguing/z3950_search.pl

index 5e22636..fe07a7d 100755 (executable)
--- a/cataloguing/z3950_search.pl
+++ b/cataloguing/z3950_search.pl
@@ -249,6 +249,10 @@ warn "query ".$query  if $DEBUG;
  ## In HEAD i change everything to UTF-8
  # In rel2_2 i am not sure what encoding is so no character conversion is done here
  ##Add necessary encoding changes to here -TG
+
+                        # Normalize the record so it doesn't have separated diacritics
+                        SetUTF8Flag($marcrecord);
+
                          my $oldbiblio = TransformMarcToKoha( $dbh, $marcrecord, "" );
                          $oldbiblio->{isbn}   =~ s/ |-|\.//g if $oldbiblio->{isbn};
                          # pad | and ( with spaces to allow line breaks in the HTML
author	Frédérick Capovilla <frederick.capovilla@libeo.com>
	Wed, 28 Sep 2011 17:58:14 +0000 (13:58 -0400)
committer	Paul Poulain <paul.poulain@biblibre.com>
	Mon, 8 Oct 2012 16:46:56 +0000 (18:46 +0200)
C4/Breeding.pm		patch | blob | history
C4/ImportBatch.pm		patch | blob | history
acqui/z3950_search.pl		patch | blob | history
cataloguing/z3950_search.pl		patch | blob | history