commit 8b4a44be0f19d3a758d9b099627da6f50349119b
parent 6c88563ded7ca45f8d3ac5940bef00e48dcbca5a
Author: Simon Kornblith <simon@simonster.com>
Date: Fri, 30 Jun 2006 19:21:36 +0000
Fixes a bug that prevented the Google Books translator from appearing.
Adjusts the Google Books translator to work with the latest revision of the site.
Renames the MODS translator to just "MODS", because "Metadata Object Description Schema (MODS)" was too long for the export dialog.
Diffstat:
2 files changed, 7 insertions(+), 7 deletions(-)
diff --git a/chrome/chromeFiles/content/scholar/xpcom/ingester.js b/chrome/chromeFiles/content/scholar/xpcom/ingester.js
@@ -291,7 +291,7 @@ Scholar.Ingester.Document = function(myBrowser, myWindow, isHidden) {
Scholar.Ingester.Document.prototype.retrieveScraper = function() {
Scholar.debug("Retrieving scrapers for "+this.url);
- var sql = 'SELECT * FROM translators WHERE type = 3 ORDER BY detectCode IS NULL DESC';
+ var sql = 'SELECT * FROM translators WHERE type = 3 ORDER BY target IS NULL ASC';
var scrapers = Scholar.DB.query(sql);
for(var i=0; i<scrapers.length; i++) {
var currentScraper = scrapers[i];
diff --git a/scrapers.sql b/scrapers.sql
@@ -2324,7 +2324,7 @@ utilities.HTTPUtilities.doGet(newUri, null, function(text) {
wait();');
-REPLACE INTO "translators" VALUES ('951c027d-74ac-47d4-a107-9c3069ab7b48', '2006-06-26 16:41:00', 3, 'Generic Scraper', 'Simon Kornblith', '',
+REPLACE INTO "translators" VALUES ('951c027d-74ac-47d4-a107-9c3069ab7b48', '2006-06-26 16:41:00', 3, 'Generic Scraper', 'Simon Kornblith', NULL,
'return "website";',
'var prefixRDF = ''http://www.w3.org/1999/02/22-rdf-syntax-ns#'';
var prefixDC = ''http://purl.org/dc/elements/1.1/'';
@@ -2420,14 +2420,14 @@ utilities.processDocuments(browser, null, newUris, function(newBrowser) {
if (prefix == ''x'') return namespace; else return null;
} : null;
- var xpath = ''/html/body/table/tbody/tr[3]/td[2][@class="content"]/div[@class="content"]/table/tbody/tr/td/p[@class="e"]/table/tbody/tr'';
+ var xpath = ''//table[@id="bib"]/tbody/tr'';
var elmts = utilities.gatherElementsOnXPath(newDoc, newDoc, xpath, nsResolver);
for(var i = 0; i<elmts.length; i++) {
var field = utilities.getNode(newDoc, elmts[i], ''./td[1]//text()'', nsResolver);
var value = utilities.getNode(newDoc, elmts[i], ''./td[2]//text()'', nsResolver);
if(field && value) {
- field = utilities.cleanString(field.nodeValue);
+ field = utilities.superCleanString(field.nodeValue);
value = utilities.cleanString(value.nodeValue);
if(field == "Title") {
model.addStatement(uri, prefixDC + ''title'', value);
@@ -2464,7 +2464,7 @@ utilities.processDocuments(browser, null, newUris, function(newBrowser) {
wait();');
-REPLACE INTO "translators" VALUES ('0e2235e7-babf-413c-9acf-f27cce5f059c', '2006-06-28 16:00:00', 2, 'Metadata Object Description Schema (MODS)', 'Simon Kornblith', 'xml',
+REPLACE INTO "translators" VALUES ('0e2235e7-babf-413c-9acf-f27cce5f059c', '2006-06-28 16:00:00', 2, 'MODS', 'Simon Kornblith', 'xml',
'options.add("Export project structure", "checkbox", "true");
options.add("Export notes", "checkbox", "true");',
'var partialItemTypes = ["bookSection", "journalArticle", "magazineArticle", "newspaperArticle"];
@@ -2729,4 +2729,5 @@ function doExport(items) {
}
write(modsCollection.toString());
-}');
-\ No newline at end of file
+}');
+