sheetjs_sheetjs/modules/45_rtf.ts

104 lines
3.9 KiB
TypeScript
Raw Permalink Normal View History

2023-04-14 07:51:02 +00:00
import { WorkBook, WorkSheet, Range, CellObject, DenseSheet, SparseSheet, ParsingOptions, WritingOptions } from '../';
2022-07-08 22:31:08 +00:00
import type { utils } from "../";
2023-04-14 07:51:02 +00:00
/* Raw file payload handed to the readers; how it is interpreted depends on `ParsingOptions.type` */
type RawData = any;

/* Helpers used by this module but declared (not defined) here */
declare var encode_cell: typeof utils.encode_cell;
declare var encode_range: typeof utils.encode_range;
declare var format_cell: typeof utils.format_cell;
declare var safe_decode_range: typeof utils.decode_range;
declare function sheet_to_workbook(s: WorkSheet, o?: any): WorkBook;
declare function cc2str(d: any): string;
declare function a2s(a: any): string;
declare var has_buf: boolean;
declare function Base64_decode(s: string): string;
declare function fuzzynum(s: string): number;
declare var RBErr: {[key: string]: number};
/* Used by rtf_to_sheet_str, which null-checks the result and iterates it as strings */
declare function str_match_ng(str: string, s: string, e: string): string[] | null;
2022-07-08 22:31:08 +00:00
2023-04-14 07:51:02 +00:00
/**
 * Convert a raw RTF payload to a worksheet.
 *
 * The payload is turned into a string according to `opts.type` and then
 * handed to `rtf_to_sheet_str` together with the original options.
 *
 * @param d    raw payload; the expected form depends on `opts.type`
 * @param opts parsing options; `type` selects the string conversion
 * @returns the worksheet produced by `rtf_to_sheet_str`
 * @throws Error when `opts.type` is not "base64", "binary", "buffer" or "array"
 */
function rtf_to_sheet(d: RawData, opts: ParsingOptions): WorkSheet {
	// A missing options object falls through to the descriptive error below
	// rather than failing on the property access.
	var type = opts ? opts.type : undefined;
	switch(type) {
		case 'base64': return rtf_to_sheet_str(Base64_decode(d), opts);
		case 'binary': return rtf_to_sheet_str(d, opts);
		// Buffers are decoded directly; anything else is passed through a2s
		case 'buffer': return rtf_to_sheet_str(has_buf && Buffer.isBuffer(d) ? d.toString('binary') : a2s(d), opts);
		case 'array': return rtf_to_sheet_str(cc2str(d), opts);
	}
	throw new Error("Unrecognized type " + type);
}
/* TODO: this is a stub */
/**
 * Build a worksheet from the table rows found in an RTF string.
 *
 * Row fragments are obtained from `str_match_ng(str, "\\trowd", "\\row")`
 * (presumably one fragment per `\trowd` ... `\row` span -- confirm against
 * that helper). Within a fragment every control word is skipped, except:
 *   - `\cell` closes the current cell and advances the column
 *   - `\par`  contributes a "\n" to the current cell text
 * Text between control words is accumulated as the cell text.
 *
 * Cell typing: "TRUE" / "FALSE" become booleans; text for which `fuzzynum`
 * returns a number becomes a numeric cell (the original text is kept in `w`
 * unless `opts.cellText === false`); text that is a key of `RBErr` becomes
 * an error cell; everything else stays a string. Cells without text are not
 * stored but still occupy a column.
 *
 * @param str  RTF document text
 * @param opts parsing options (`dense`, `cellText` are read); may be omitted
 * @returns worksheet whose `!ref` spans rows 0..(rows-1) and columns 0..(widest row)
 * @throws Error("RTF missing table") when no row fragment is found
 */
function rtf_to_sheet_str(str: string, opts: ParsingOptions): WorkSheet {
	var o = opts || {};
	// ESBuild issue 2375
	var ws: WorkSheet = {} as WorkSheet;
	var dense = o.dense;
	if(dense) ws["!data"] = [];

	var rows = str_match_ng(str, "\\trowd", "\\row");
	if(!rows) throw new Error("RTF missing table");
	var range: Range = {s: {c:0, r:0}, e: {c:0, r:rows.length - 1}};
	var row: CellObject[] = [];
	rows.forEach(function(rowtf: string, R: number) {
		if(dense) row = (ws as DenseSheet)["!data"][R] = [] as CellObject[];
		// fresh regex per row: the `g` flag keeps scan state in lastIndex
		var rtfre = /\\[\w\-]+\b/g;
		var last_index = 0;
		var res: RegExpExecArray | null;
		var C = -1;
		var payload: string[] = [];
		while((res = rtfre.exec(rowtf)) != null) {
			// text between the previous control word and this one
			var data = rowtf.slice(last_index, res.index);
			// drop the single space that delimits a control word from its text
			if(data.charCodeAt(0) == 0x20) data = data.slice(1);
			if(data.length) payload.push(data);
			switch(res[0]) {
				case "\\cell":
					++C;
					if(payload.length) {
						// TODO: value parsing, including codepage adjustments
						var text = payload.join("");
						var cell: CellObject = {v: text, t:"s"};
						if(text == "TRUE" || text == "FALSE") { cell.v = text == "TRUE"; cell.t = "b"; }
						else {
							// parse once and reuse the result for both the test and the value
							var num = fuzzynum(text);
							if(!isNaN(num)) { cell.t = 'n'; if(o.cellText !== false) cell.w = text; cell.v = num; }
							else if(RBErr[text] != null) { cell.t = "e"; cell.w = text; cell.v = RBErr[text]; }
						}
						if(dense) row[C] = cell;
						else (ws as SparseSheet)[encode_cell({r:R, c:C})] = cell;
					}
					payload = [];
					break;
				case "\\par": // NOTE: Excel serializes both "\r" and "\n" as "\\par"
					payload.push("\n");
					break;
			}
			last_index = rtfre.lastIndex;
		}
		// widen the sheet range to the widest row seen so far
		if(C > range.e.c) range.e.c = C;
	});
	ws['!ref'] = encode_range(range);
	return ws;
}
2023-04-14 07:51:02 +00:00
/**
 * Read raw RTF data into a workbook.
 *
 * The data is parsed with `rtf_to_sheet`, the resulting sheet is wrapped
 * with `sheet_to_workbook`, and the workbook is tagged as `bookType` "rtf".
 *
 * @param d    raw payload, forwarded to `rtf_to_sheet`
 * @param opts parsing options, forwarded to both helpers
 * @returns the workbook returned by `sheet_to_workbook`, with `bookType` set
 */
function rtf_to_workbook(d: RawData, opts: ParsingOptions): WorkBook {
	var wb: WorkBook = sheet_to_workbook(rtf_to_sheet(d, opts), opts);
	wb.bookType = "rtf";
	return wb;
}
/* TODO: this is a stub */
/**
 * Serialize a worksheet as an RTF document containing a single table.
 *
 * Every row of the sheet range becomes one `\trowd` ... `\row` group with
 * one `\cellx` boundary and one `\cell` per column of the range. Cell text
 * is taken from `cell.w`, falling back to whatever `format_cell` stores in
 * `cell.w`; each "\r" or "\n" in the text is written as `\par `.
 *
 * NOTE: apart from line breaks the text is emitted verbatim -- `\`, `{` and
 * `}` inside cell text are not escaped.
 *
 * @param ws   worksheet to write (sparse, or dense when `!data` is present)
 * @param opts writing options (currently unused by this function)
 * @returns the RTF text; just `{\rtf1\ansi}` when the sheet has no `!ref`
 */
function sheet_to_rtf(ws: WorkSheet, opts: WritingOptions): string {
	var o: string[] = ["{\\rtf1\\ansi"];
	if(!ws["!ref"]) return o[0] + "}";
	var r = safe_decode_range(ws['!ref']), cell: CellObject;
	var dense = ws["!data"] != null, row: CellObject[] = [];
	for(var R = r.s.r; R <= r.e.r; ++R) {
		o.push("\\trowd\\trautofit1");
		for(var C = r.s.c; C <= r.e.c; ++C) o.push("\\cellx" + (C+1));
		o.push("\\pard\\intbl");
		// rows absent from a dense sheet are written as all-empty rows
		if(dense) row = (ws as DenseSheet)["!data"][R] || ([] as CellObject[]);
		for(C = r.s.c; C <= r.e.c; ++C) {
			// the encoded address is only needed to look up cells in sparse sheets
			cell = dense ? row[C] : (ws as SparseSheet)[encode_cell({r:R,c:C})];
			// missing cells, and valueless cells that have no formula (or carry `F`), are left blank
			if(!cell || cell.v == null && (!cell.f || cell.F)) { o.push(" \\cell"); continue; }
			o.push(" " + (cell.w || (format_cell(cell), cell.w) || "").replace(/[\r\n]/g, "\\par "));
			o.push("\\cell");
		}
		o.push("\\pard\\intbl\\row");
	}
	return o.join("") + "}";
}