HTML/RTF and RTF/HTML conversion for styled textbox
This commit is contained in:
parent
70c41e8a51
commit
9431e0de53
1 changed files with 310 additions and 99 deletions
|
@ -49,57 +49,317 @@
|
||||||
|
|
||||||
this._iframe = document.getAnonymousElementByAttribute(this, "anonid", "rt-view");
|
this._iframe = document.getAnonymousElementByAttribute(this, "anonid", "rt-view");
|
||||||
|
|
||||||
this._rtfMap = {
|
this._htmlRTFmap = [
|
||||||
"\\":"\\\\",
|
// Atomic units, HTML -> RTF (cleanup)
|
||||||
"<em>":"\\i ",
|
[/<br \/>/g, "\x0B"],
|
||||||
"</em>":"\\i0{}",
|
[/<span class=\"tab\"> <\/span>/g, "\\tab{}"],
|
||||||
"<i>":"\\i ",
|
[/‘/g, "‘"],
|
||||||
"</i>":"\\i0{}",
|
[/’/g, "’"],
|
||||||
"<strong>":"\\b ",
|
[/“/g, "“"],
|
||||||
"</strong>":"\\b0{}",
|
[/”/g, "”"],
|
||||||
"<b>":"\\b ",
|
[/ /g, "\u00A0"],
|
||||||
"</b>":"\\b0{}",
|
[/"(\w)/g, "“$1"],
|
||||||
"<br />":"\x0B",
|
[/([\w,.?!])"/g, "$1”"],
|
||||||
// there's no way to mimic a tab stop in CSS without
|
[/<p>/g, ""],
|
||||||
// tables, which wouldn't work here.
|
|
||||||
'<span class="tab"> </span>':"\\tab{}"
|
|
||||||
};
|
|
||||||
|
|
||||||
this._rtfToHtmlMap = [
|
|
||||||
[/\\uc0\{?\\u([0-9]+)\}?(?:{}| )?/g, function(wholeStr, aCode) { return String.fromCharCode(aCode) }],
|
|
||||||
[/\\tab(?:\{\}| )/g, '<span class="tab"> </span>'],
|
|
||||||
[/(?:\\par{}|\\\r?\n)/g, "</p><p>"],
|
|
||||||
[/\\super (.*?)\\nosupersub{}/g, "<sup>$1</sup>"],
|
|
||||||
[/\\sub (.*?)\\nosupersub{}/g, "<sub>$1</sub>"],
|
|
||||||
// for backwards compatibility with Zotero < 2.1
|
|
||||||
["\\i0 ", "</em>"],
|
|
||||||
["\\b0 ", "</strong>"]
|
|
||||||
];
|
|
||||||
|
|
||||||
this._htmlToRtfMap = [
|
|
||||||
[/"(\w)/, "“$1"],
|
|
||||||
[/([\w,.?!])"/, "$1”"],
|
|
||||||
["<p>", ""],
|
|
||||||
//[/<\/p>(?!\s*$)/g, "\\par{}"],
|
//[/<\/p>(?!\s*$)/g, "\\par{}"],
|
||||||
[/<\/?div[^>]*>/g, ""],
|
[/<\/?div[^>]*>/g, ""],
|
||||||
["<sup>", "\\super "],
|
//[/ /g, " "],
|
||||||
["</sup>", "\\nosupersub{}"],
|
//[/\u00A0/g, " "],
|
||||||
["<sub>", "\\sub "],
|
[/[\x7F-\uFFFF]/g, function(aChar) { return "\\uc0\\u"+aChar.charCodeAt(0).toString()+"{}"}]
|
||||||
["</sub>", "\\nosupersub{}"]
|
|
||||||
];
|
];
|
||||||
|
|
||||||
this._rtfRexMap = [
|
this._rtfHTMLmap = [
|
||||||
["<span style=\"font-variant:small-caps;\">",
|
// Atomic units, RTF -> HTML (cleanup)
|
||||||
/small-caps/,
|
[/\\uc0\{?\\u([0-9]+)\}?(?:{}| )?/g, function(wholeStr, aCode) { return String.fromCharCode(aCode) }],
|
||||||
"\\scaps ",
|
[/\\tab(?:\{\}| )/g, '<span class="tab"> </span>'],
|
||||||
"\\scaps0{}"
|
[/(?:\\par{}|\\\r?\n)/g, "</p><p>"]
|
||||||
],
|
];
|
||||||
["<span style=\"text-decoration:underline;\">",
|
|
||||||
/underline/,
|
this.init = function() {
|
||||||
"\\ul ",
|
if (this.initialized) return;
|
||||||
"\\ul0{}"
|
// Tag data
|
||||||
]
|
var _rexData = [
|
||||||
]
|
[
|
||||||
|
[
|
||||||
|
["<span style=\"font-variant:small-caps;\">"],
|
||||||
|
["{\\scaps ", "{\\scaps{}"]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["<\/span>"],
|
||||||
|
["}"]
|
||||||
|
]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
[
|
||||||
|
["<span style=\"text-decoration:underline;\">"],
|
||||||
|
["{\\ul{}", "{\\ul "]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["<\/span>"],
|
||||||
|
["}"]
|
||||||
|
]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
[
|
||||||
|
["<sup>"],
|
||||||
|
["\\super ", "\\super{}"]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["</sup>"],
|
||||||
|
["\\nosupersub{}", "\\nosupersub "]
|
||||||
|
]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
[
|
||||||
|
["<sub>"],
|
||||||
|
["\\sub ", "\\sub{}"]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["</sub>"],
|
||||||
|
["\\nosupersub{}", "\\nosupersub "]
|
||||||
|
]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
[
|
||||||
|
["<em>"],
|
||||||
|
["{\\i{}", "{\\i "]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["</em>"],
|
||||||
|
["}"]
|
||||||
|
]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
[
|
||||||
|
["<i>"],
|
||||||
|
["{\\i{}", "{\\i "]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["</i>"],
|
||||||
|
["}"]
|
||||||
|
]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
[
|
||||||
|
["<b>"],
|
||||||
|
["{\\b{}", "{\\b "]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["</b>"],
|
||||||
|
["}"]
|
||||||
|
]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
[
|
||||||
|
["<strong>"],
|
||||||
|
["{\\b{}", "{\\b "]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["</strong>"],
|
||||||
|
["}"]
|
||||||
|
]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
[
|
||||||
|
["<span style=\"font-variant:normal;\">"],
|
||||||
|
["{\\scaps0{}", "{\\scaps0 "]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["</span>"],
|
||||||
|
["}"]
|
||||||
|
]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
[
|
||||||
|
["<span style=\"font-style:normal;\">"],
|
||||||
|
["{\\i0{}", "{\\i0 "]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["</span>"],
|
||||||
|
["}"]
|
||||||
|
]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
[
|
||||||
|
["<span style=\"font-weight:normal;\">"],
|
||||||
|
["{\\b0{}", "{\\b0 "]
|
||||||
|
],
|
||||||
|
[
|
||||||
|
["</span>"],
|
||||||
|
["}"]
|
||||||
|
]
|
||||||
|
]
|
||||||
|
];
|
||||||
|
|
||||||
|
function longestFirst(a, b) {
|
||||||
|
if (a.length < b.length) {
|
||||||
|
return 1;
|
||||||
|
} else if (a.length > b.length) {
|
||||||
|
return -1;
|
||||||
|
} else {
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
function composeRex(rexes, noGlobal) {
|
||||||
|
var lst = [];
|
||||||
|
for (var rex in rexes) {
|
||||||
|
lst.push(rex);
|
||||||
|
}
|
||||||
|
lst.sort(longestFirst);
|
||||||
|
var rexStr = "(?:" + lst.join("|") + ")";
|
||||||
|
return new RegExp(rexStr, "g");
|
||||||
|
}
|
||||||
|
|
||||||
|
// Create splitting regexps
|
||||||
|
function splitRexMaker(segment) {
|
||||||
|
var rexes = {};
|
||||||
|
for (var i=0,ilen=_rexData.length; i < ilen; i++) {
|
||||||
|
for (var j=0,jlen=_rexData[i].length; j < jlen; j++) {
|
||||||
|
for (var k=0,klen=_rexData[i][j][segment].length; k < klen; k++) {
|
||||||
|
rexes[_rexData[i][j][segment][k].replace("\\", "\\\\")] = true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
var ret = composeRex(rexes, true);
|
||||||
|
return ret;
|
||||||
|
}
|
||||||
|
this.rtfHTMLsplitRex = splitRexMaker(1);
|
||||||
|
this.htmlRTFsplitRex = splitRexMaker(0);
|
||||||
|
|
||||||
|
// Create open-tag sniffing regexp
|
||||||
|
function openSniffRexMaker(segment) {
|
||||||
|
var rexes = {};
|
||||||
|
for (var i=0,ilen=_rexData.length; i < ilen; i++) {
|
||||||
|
for (var j=0,jlen=_rexData[i][0][segment].length; j < jlen; j++) {
|
||||||
|
rexes[_rexData[i][0][segment][j].replace("\\", "\\\\")] = true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return composeRex(rexes);
|
||||||
|
}
|
||||||
|
this.rtfHTMLopenSniffRex = openSniffRexMaker(1);
|
||||||
|
this.htmlRTFopenSniffRex = openSniffRexMaker(0);
|
||||||
|
|
||||||
|
// Create open-tag remapper
|
||||||
|
function openTagRemapMaker(segment) {
|
||||||
|
var ret = {};
|
||||||
|
for (var i=0,ilen=_rexData.length; i < ilen; i++) {
|
||||||
|
var master = _rexData[i][0][segment][0];
|
||||||
|
for (var j=0,jlen=_rexData[i][0][segment].length; j < jlen; j++) {
|
||||||
|
ret[_rexData[i][0][segment][j]] = master;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return ret;
|
||||||
|
}
|
||||||
|
this.rtfHTMLopenTagRemap = openTagRemapMaker(1);
|
||||||
|
this.htmlRTFopenTagRemap = openTagRemapMaker(0);
|
||||||
|
|
||||||
|
// Create open-tag-keyed close-tag sniffing regexps
|
||||||
|
function closeTagRexMaker(segment) {
|
||||||
|
var ret = {};
|
||||||
|
var rexes = {};
|
||||||
|
for (var i=0,ilen=_rexData.length; i < ilen; i++) {
|
||||||
|
var master = _rexData[i][0][segment][0];
|
||||||
|
for (var j=0,jlen=_rexData[i][1][segment].length; j < jlen; j++) {
|
||||||
|
rexes[_rexData[i][1][segment][j]] = true;
|
||||||
|
}
|
||||||
|
ret[master] = composeRex(rexes);
|
||||||
|
}
|
||||||
|
return ret;
|
||||||
|
}
|
||||||
|
this.rtfHTMLcloseTagRex = closeTagRexMaker(1);
|
||||||
|
this.htmlRTFcloseTagRex = closeTagRexMaker(0);
|
||||||
|
|
||||||
|
// Create open-tag-keyed open/close tag registry
|
||||||
|
function tagRegistryMaker(segment) {
|
||||||
|
var antisegment = 1;
|
||||||
|
if (segment == 1) {
|
||||||
|
antisegment = 0;
|
||||||
|
}
|
||||||
|
var ret = {};
|
||||||
|
for (var i=0,ilen=_rexData.length; i < ilen; i++) {
|
||||||
|
var master = _rexData[i][0][segment][0];
|
||||||
|
ret[master] = {
|
||||||
|
open: _rexData[i][0][antisegment][0],
|
||||||
|
close: _rexData[i][1][antisegment][0]
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return ret;
|
||||||
|
}
|
||||||
|
this.rtfHTMLtagRegistry = tagRegistryMaker(1);
|
||||||
|
this.htmlRTFtagRegistry = tagRegistryMaker(0);
|
||||||
|
|
||||||
|
this.initialized = true;
|
||||||
|
}
|
||||||
|
this.init();
|
||||||
|
|
||||||
|
this.getSplit = function(mode, txt) {
|
||||||
|
if (!txt) return [];
|
||||||
|
var splt = txt.split(this[mode + "splitRex"]);
|
||||||
|
var mtch = txt.match(this[mode + "splitRex"]);
|
||||||
|
var lst = [splt[0]];
|
||||||
|
for (var i=1,ilen=splt.length; i < ilen; i++) {
|
||||||
|
lst.push(mtch[i-1]);
|
||||||
|
lst.push(splt[i]);
|
||||||
|
}
|
||||||
|
return lst;
|
||||||
|
}
|
||||||
|
|
||||||
|
this.getOpenTag = function(mode, str) {
|
||||||
|
var m = str.match(this[mode + "openSniffRex"]);
|
||||||
|
if (m) {
|
||||||
|
m = this[mode + "openTagRemap"][m[0]];
|
||||||
|
}
|
||||||
|
return m;
|
||||||
|
}
|
||||||
|
|
||||||
|
this.convert = function(mode, txt) {
|
||||||
|
var lst = this.getSplit(mode, txt);
|
||||||
|
var sdepth = 0;
|
||||||
|
var depth = 0;
|
||||||
|
for (var i=1,ilen=lst.length; i < ilen; i += 2) {
|
||||||
|
var openTag = this.getOpenTag(mode, lst[i]);
|
||||||
|
if (openTag) {
|
||||||
|
sdepth++;
|
||||||
|
depth = sdepth;
|
||||||
|
for (var j=(i+2),jlen=lst.length; j < jlen; j += 2) {
|
||||||
|
var closeTag = !this.getOpenTag(mode, lst[j]);
|
||||||
|
if (closeTag) {
|
||||||
|
if (depth === sdepth && lst[j].match(this[mode + "closeTagRex"][openTag])) {
|
||||||
|
lst[i] = this[mode + "tagRegistry"][openTag].open;
|
||||||
|
lst[j] = this[mode + "tagRegistry"][openTag].close;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
depth--;
|
||||||
|
} else {
|
||||||
|
depth++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
sdepth--;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return lst.join("");
|
||||||
|
}
|
||||||
|
|
||||||
|
this.htmlToRTF = function(txt) {
|
||||||
|
txt = this.convert("htmlRTF", txt);
|
||||||
|
for (var i=0,ilen=this._htmlRTFmap.length; i < ilen; i++) {
|
||||||
|
var entry = this._htmlRTFmap[i];
|
||||||
|
txt = txt.replace(entry[0], entry[1]);
|
||||||
|
}
|
||||||
|
txt = Zotero.Utilities.unescapeHTML(txt);
|
||||||
|
return txt.trim();
|
||||||
|
}
|
||||||
|
|
||||||
|
this.rtfToHTML = function(txt) {
|
||||||
|
for (var i=0,ilen=this._rtfHTMLmap.length; i < ilen; i++) {
|
||||||
|
var entry = this._rtfHTMLmap[i];
|
||||||
|
txt = txt.replace(entry[0], entry[1]);
|
||||||
|
}
|
||||||
|
txt = this.convert("rtfHTML", txt);
|
||||||
|
return txt;
|
||||||
|
}
|
||||||
|
|
||||||
this._constructed = true;
|
this._constructed = true;
|
||||||
|
|
||||||
|
@ -213,7 +473,6 @@
|
||||||
<!-- Sets or returns contents of rich text box -->
|
<!-- Sets or returns contents of rich text box -->
|
||||||
<property name="value">
|
<property name="value">
|
||||||
<getter><![CDATA[
|
<getter><![CDATA[
|
||||||
const highcharRe = /[\x7F-\uFFFF]/g;
|
|
||||||
var output = this._editor.getContent();
|
var output = this._editor.getContent();
|
||||||
|
|
||||||
if(this._format == "RTF") {
|
if(this._format == "RTF") {
|
||||||
|
@ -221,44 +480,7 @@
|
||||||
if(output.substr(0, 5) == "<div>" && output.substr(-6) == "</div>") {
|
if(output.substr(0, 5) == "<div>" && output.substr(-6) == "</div>") {
|
||||||
output = output.substr(5, output.length-6);
|
output = output.substr(5, output.length-6);
|
||||||
}
|
}
|
||||||
|
output = this.htmlToRTF(output)
|
||||||
// do appropriate replacement operations
|
|
||||||
for(var needle in this._rtfMap) {
|
|
||||||
output = output.replace(needle, this._rtfMap[needle], "g");
|
|
||||||
}
|
|
||||||
|
|
||||||
// Preserve small caps and underlining
|
|
||||||
for each (var tagspec in this._rtfRexMap){
|
|
||||||
var l = output.split(/(<\/?span[^>]*>)/);
|
|
||||||
var current_level = 0;
|
|
||||||
var tag_level = [];
|
|
||||||
for (var pos=1; pos<l.length; pos+=2) {
|
|
||||||
var tag = l[pos];
|
|
||||||
if (tag[1] == "/") {
|
|
||||||
current_level--;
|
|
||||||
if (current_level == tag_level[tag_level.length-1]) {
|
|
||||||
tag_level.pop();
|
|
||||||
l[pos] = tagspec[3];
|
|
||||||
}
|
|
||||||
} else {
|
|
||||||
if (l[pos].match(tagspec[1])) {
|
|
||||||
l[pos] = tagspec[2];
|
|
||||||
tag_level.push(current_level);
|
|
||||||
}
|
|
||||||
current_level++;
|
|
||||||
};
|
|
||||||
};
|
|
||||||
output = l.join("");
|
|
||||||
}
|
|
||||||
|
|
||||||
for each(var entry in this._htmlToRtfMap) {
|
|
||||||
output = output.replace(entry[0], entry[1], "g");
|
|
||||||
}
|
|
||||||
|
|
||||||
output = Zotero.Utilities.unescapeHTML(output.replace(" ", " ", "g"))
|
|
||||||
.replace("\u00A0", " ", "g")
|
|
||||||
.replace(highcharRe, function(aChar) { return "\\uc0\\u"+aChar.charCodeAt(0).toString()+"{}" });
|
|
||||||
output = Zotero.Utilities.trim(output);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
return output;
|
return output;
|
||||||
|
@ -313,19 +535,8 @@
|
||||||
bodyStyle = "margin-left:"+(li/20+6)+"pt;text-indent:"+(fi/20)+"pt;";
|
bodyStyle = "margin-left:"+(li/20+6)+"pt;text-indent:"+(fi/20)+"pt;";
|
||||||
}
|
}
|
||||||
|
|
||||||
// do appropriate replacement operations
|
html = this.rtfToHTML(html);
|
||||||
for(var needle in this._rtfMap) {
|
|
||||||
if(this._rtfMap[needle]) {
|
|
||||||
html = html.replace(this._rtfMap[needle], needle, "g");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
for each (var tagspec in this._rtfRexMap){
|
|
||||||
html = html.replace(tagspec[2], tagspec[0], "g");
|
|
||||||
html = html.replace(tagspec[3], "</span>", "g");
|
|
||||||
}
|
|
||||||
for each(var entry in this._rtfToHtmlMap) {
|
|
||||||
html = html.replace(entry[0], entry[1], "g");
|
|
||||||
}
|
|
||||||
html = '<div style="'+bodyStyle+'"><p>'+html+"</p></div>";
|
html = '<div style="'+bodyStyle+'"><p>'+html+"</p></div>";
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
Loading…
Reference in a new issue