www

Unnamed repository; edit this file 'description' to name the repository.
Log | Files | Refs | Submodules | README | LICENSE

commit e3d062a81968ed828d71bf451c1c311ce4742ff2
parent 2b5b65f4ddbe8d253509ed716f103c22469c8b66
Author: Simon Kornblith <simon@simonster.com>
Date:   Mon,  7 Aug 2006 01:49:56 +0000

fix inappropriately truncated field values in InnoPAC


Diffstat:
M scrapers.sql | 7 +++----
1 file changed, 3 insertions(+), 4 deletions(-)

diff --git a/scrapers.sql b/scrapers.sql
@@ -1,7 +1,7 @@
--- 36
+-- 37
 
 -- Set the following timestamp to the most recent scraper update date
-REPLACE INTO "version" VALUES ('repository', STRFTIME('%s', '2006-08-06 19:14:00'));
+REPLACE INTO "version" VALUES ('repository', STRFTIME('%s', '2006-08-06 21:45:00'));
 
 REPLACE INTO "translators" VALUES ('96b9f483-c44d-5784-cdad-ce21b984fe01', '2006-06-28 23:08:00', 4, 'Amazon.com Scraper', 'Simon Kornblith', '^http://www\.amazon\.com/(?:gp/(?:product|search)/|exec/obidos/search-handle-url/|s/)',
 'function detect(doc, url) {
@@ -656,7 +656,7 @@ function doWeb(doc, url) {
 	}
 }');
 
-REPLACE INTO "translators" VALUES ('4fd6b89b-2316-2dc4-fd87-61a97dd941e8', '2006-06-28 22:52:00', 4, 'InnoPAC Scraper', 'Simon Kornblith', '^http://[^/]+/(?:search/|record=)',
+REPLACE INTO "translators" VALUES ('4fd6b89b-2316-2dc4-fd87-61a97dd941e8', '2006-08-06 21:45:00', 4, 'InnoPAC Scraper', 'Simon Kornblith', '^http://[^/]+/(?:search/|record=)',
 'function detect(doc, url) {
 	// First, check to see if the URL alone reveals InnoPAC, since some sites don''t reveal the MARC button
 	var matchRegexp = new RegExp(''^(http://[^/]+/search/[^/]+/[^/]+/1\%2C[^/]+/)frameset(.+)$'');
@@ -730,7 +730,6 @@ REPLACE INTO "translators" VALUES ('4fd6b89b-2316-2dc4-fd87-61a97dd941e8', '2006
 	var linee = text.split("\n");
 	for (var i=0; i<linee.length; i++) {
 		linee[i] = linee[i].replace(/\xA0|_|\t/g,'' '');
-		linee[i] = Scholar.Utilities.cleanString(linee[i]);
 		if (linee[i] == '''') continue; // jumps empty lines
 		var replacer = record.subfield_delimiter+''$1'';
 		linee[i] = linee[i].replace(/\|(.)/g,replacer);