commit 1374cc911aa727d88f3bbe0d39eddf219f3fc6dd
parent 46ff2f464d974e203869b110e66f25df438f1ffb
Author: Aurimas Vinckevicius <aurimas.dev@gmail.com>
Date: Thu, 11 Jun 2015 18:25:32 -0500
Always save snapshots in UTF-8 encoding
Re https://forums.zotero.org/discussion/49897/thecreate-web-page-item-from-current-pageis-sometimes-not-working-correctly/
There is something wrong with the way nsIScriptableUnicodeConverter converts to GBK (and possibly other encodings too). The HTML of http://www.cmiw.cn/forum.php is truncated in the middle of an em tag. In general, ConvertFromUnicode is supposed to return an ACString (not an AString), which is not something that JavaScript can handle well.
Diffstat:
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/chrome/content/zotero/webpagedump/domsaver.js b/chrome/content/zotero/webpagedump/domsaver.js
@@ -199,7 +199,7 @@ var wpdDOMSaver = {
// Changed by Dan for Zotero
"script": true, // no scripts
- "encodeUTF8": false, // write the DOM Tree as UTF-8 and change the charset entry of the document
+ "encodeUTF8": true, // write the DOM Tree as UTF-8 and change the charset entry of the document
"metainfo": true, // include meta tags with URL and date/time information
"metacharset": false // if the meta charset is defined inside html override document charset
//"xtagging" : true // include a x tag around each word