mirror of
https://github.com/mozilla/pdf.js.git
synced 2025-04-22 16:18:08 +02:00
XFA -- Add support for SOM expressions (#12983)
- specifications: http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.364.2157&rep=rep1&type=pdf#page=87; - add a parser for SOM expressions; - add search functions to resolve those expressions; - search functions will be used to bind data into template.
This commit is contained in:
parent
fafe039849
commit
45329af926
3 changed files with 610 additions and 3 deletions
232
src/core/xfa/som.js
Normal file
232
src/core/xfa/som.js
Normal file
|
@ -0,0 +1,232 @@
|
|||
/* Copyright 2021 Mozilla Foundation
|
||||
*
|
||||
* Licensed under the Apache License, Version 2.0 (the "License");
|
||||
* you may not use this file except in compliance with the License.
|
||||
* You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
import {
|
||||
$getChildrenByClass,
|
||||
$getChildrenByName,
|
||||
$getParent,
|
||||
XFAObject,
|
||||
XFAObjectArray,
|
||||
} from "./xfa_object.js";
|
||||
import { warn } from "../../shared/util.js";
|
||||
|
||||
const namePattern = /^[^.[]+/;
|
||||
const indexPattern = /^[^\]]+/;
|
||||
const operators = {
|
||||
dot: 0,
|
||||
dotDot: 1,
|
||||
dotHash: 2,
|
||||
dotBracket: 3,
|
||||
dotParen: 4,
|
||||
};
|
||||
|
||||
const shortcuts = new Map([
|
||||
["$data", root => root.datasets.data],
|
||||
["$template", root => root.template],
|
||||
["$connectionSet", root => root.connectionSet],
|
||||
["$form", root => root.form],
|
||||
["$layout", root => root.layout],
|
||||
["$host", root => root.host],
|
||||
["$dataWindow", root => root.dataWindow],
|
||||
["$event", root => root.event],
|
||||
["!", root => root.datasets],
|
||||
["$xfa", root => root],
|
||||
["xfa", root => root],
|
||||
]);
|
||||
|
||||
const somCache = new WeakMap();
|
||||
|
||||
function parseIndex(index) {
|
||||
index = index.trim();
|
||||
if (index === "*") {
|
||||
return Infinity;
|
||||
}
|
||||
return parseInt(index, 10) || 0;
|
||||
}
|
||||
|
||||
function parseExpression(expr, dotDotAllowed) {
|
||||
let match = expr.match(namePattern);
|
||||
if (!match) {
|
||||
return null;
|
||||
}
|
||||
|
||||
let [name] = match;
|
||||
const parsed = [
|
||||
{
|
||||
name,
|
||||
cacheName: "." + name,
|
||||
index: 0,
|
||||
js: null,
|
||||
formCalc: null,
|
||||
operator: operators.dot,
|
||||
},
|
||||
];
|
||||
|
||||
let pos = name.length;
|
||||
|
||||
while (pos < expr.length) {
|
||||
const spos = pos;
|
||||
const char = expr.charAt(pos++);
|
||||
if (char === "[") {
|
||||
match = expr.slice(pos).match(indexPattern);
|
||||
if (!match) {
|
||||
warn("XFA - Invalid index in SOM expression");
|
||||
return null;
|
||||
}
|
||||
parsed[parsed.length - 1].index = parseIndex(match[0]);
|
||||
pos += match[0].length + 1;
|
||||
continue;
|
||||
}
|
||||
|
||||
let operator;
|
||||
switch (expr.charAt(pos)) {
|
||||
case ".":
|
||||
if (!dotDotAllowed) {
|
||||
return null;
|
||||
}
|
||||
pos++;
|
||||
operator = operators.dotDot;
|
||||
break;
|
||||
case "#":
|
||||
pos++;
|
||||
operator = operators.dotHash;
|
||||
break;
|
||||
case "[":
|
||||
// TODO: FormCalc expression so need to use the parser
|
||||
operator = operators.dotBracket;
|
||||
break;
|
||||
case "(":
|
||||
// TODO:
|
||||
// Javascript expression: should be a boolean operation with a path
|
||||
// so maybe we can have our own parser for that stuff or
|
||||
// maybe use the formcalc one.
|
||||
operator = operators.dotParen;
|
||||
break;
|
||||
default:
|
||||
operator = operators.dot;
|
||||
break;
|
||||
}
|
||||
|
||||
match = expr.slice(pos).match(namePattern);
|
||||
if (!match) {
|
||||
break;
|
||||
}
|
||||
|
||||
[name] = match;
|
||||
pos += name.length;
|
||||
parsed.push({
|
||||
name,
|
||||
cacheName: expr.slice(spos, pos),
|
||||
operator,
|
||||
index: 0,
|
||||
js: null,
|
||||
formCalc: null,
|
||||
});
|
||||
}
|
||||
return parsed;
|
||||
}
|
||||
|
||||
function searchNode(root, container, expr, dotDotAllowed = true) {
|
||||
const parsed = parseExpression(expr, dotDotAllowed);
|
||||
if (!parsed) {
|
||||
return null;
|
||||
}
|
||||
const fn = shortcuts.get(parsed[0].name);
|
||||
let i = 0;
|
||||
let isQualified;
|
||||
if (fn) {
|
||||
isQualified = true;
|
||||
root = [fn(root)];
|
||||
i = 1;
|
||||
} else {
|
||||
isQualified = container === null;
|
||||
root = [container || root];
|
||||
}
|
||||
|
||||
for (let ii = parsed.length; i < ii; i++) {
|
||||
const { name, cacheName, operator, index } = parsed[i];
|
||||
const nodes = [];
|
||||
for (const node of root) {
|
||||
if (!(node instanceof XFAObject)) {
|
||||
continue;
|
||||
}
|
||||
|
||||
let cached = somCache.get(node);
|
||||
if (!cached) {
|
||||
cached = new Map();
|
||||
somCache.set(node, cached);
|
||||
}
|
||||
|
||||
let children = cached.get(cacheName);
|
||||
if (!children) {
|
||||
switch (operator) {
|
||||
case operators.dot:
|
||||
children = node[$getChildrenByName](name, false);
|
||||
break;
|
||||
case operators.dotDot:
|
||||
children = node[$getChildrenByName](name, true);
|
||||
break;
|
||||
case operators.dotHash:
|
||||
children = node[$getChildrenByClass](name);
|
||||
if (children instanceof XFAObjectArray) {
|
||||
children = children.children;
|
||||
} else {
|
||||
children = [children];
|
||||
}
|
||||
break;
|
||||
default:
|
||||
break;
|
||||
}
|
||||
cached.set(cacheName, children);
|
||||
}
|
||||
|
||||
if (children.length > 0) {
|
||||
nodes.push(children);
|
||||
}
|
||||
}
|
||||
|
||||
if (nodes.length === 0 && !isQualified && i === 0) {
|
||||
// We've an unqualified expression and we didn't find anything
|
||||
// so look at container and siblings of container and so on.
|
||||
// http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.364.2157&rep=rep1&type=pdf#page=114
|
||||
const parent = container[$getParent]();
|
||||
container = parent;
|
||||
if (!container) {
|
||||
return null;
|
||||
}
|
||||
i = -1;
|
||||
root = [container];
|
||||
continue;
|
||||
}
|
||||
|
||||
if (isFinite(index)) {
|
||||
root = nodes.filter(node => index < node.length).map(node => node[index]);
|
||||
} else {
|
||||
root = nodes.reduce((acc, node) => acc.concat(node), []);
|
||||
}
|
||||
}
|
||||
|
||||
if (root.length === 0) {
|
||||
return null;
|
||||
}
|
||||
|
||||
if (root.length === 1) {
|
||||
return root[0];
|
||||
}
|
||||
|
||||
return root;
|
||||
}
|
||||
|
||||
export { searchNode };
|
|
@ -24,7 +24,13 @@ const $cleanup = Symbol();
|
|||
const $content = Symbol("content");
|
||||
const $dump = Symbol();
|
||||
const $finalize = Symbol();
|
||||
const $isDataValue = Symbol();
|
||||
const $getAttributeIt = Symbol();
|
||||
const $getChildrenByClass = Symbol();
|
||||
const $getChildrenByName = Symbol();
|
||||
const $getChildrenByNameIt = Symbol();
|
||||
const $getChildren = Symbol();
|
||||
const $getParent = Symbol();
|
||||
const $isTransparent = Symbol();
|
||||
const $lastAttribute = Symbol();
|
||||
const $namespaceId = Symbol("namespaceId");
|
||||
|
@ -139,12 +145,16 @@ class XFAObject {
|
|||
return shadow(this, _attributeNames, proto._attributes);
|
||||
}
|
||||
|
||||
[$getParent]() {
|
||||
return this[_parent];
|
||||
}
|
||||
|
||||
[$getChildren](name = null) {
|
||||
if (!name) {
|
||||
return this[_children];
|
||||
}
|
||||
|
||||
return this[_children].filter(c => c[$nodeName] === name);
|
||||
return this[name];
|
||||
}
|
||||
|
||||
[$dump]() {
|
||||
|
@ -363,6 +373,47 @@ class XFAObject {
|
|||
|
||||
return clone;
|
||||
}
|
||||
|
||||
[$getChildren](name = null) {
|
||||
if (!name) {
|
||||
return this[_children];
|
||||
}
|
||||
|
||||
return this[_children].filter(c => c[$nodeName] === name);
|
||||
}
|
||||
|
||||
[$getChildrenByClass](name) {
|
||||
return this[name];
|
||||
}
|
||||
|
||||
[$getChildrenByName](name, allTransparent, first = true) {
|
||||
return Array.from(this[$getChildrenByNameIt](name, allTransparent, first));
|
||||
}
|
||||
|
||||
*[$getChildrenByNameIt](name, allTransparent, first = true) {
|
||||
if (name === "parent") {
|
||||
yield this[_parent];
|
||||
return;
|
||||
}
|
||||
|
||||
for (const child of this[_children]) {
|
||||
if (child[$nodeName] === name) {
|
||||
yield child;
|
||||
}
|
||||
|
||||
if (child.name === name) {
|
||||
yield child;
|
||||
}
|
||||
|
||||
if (allTransparent || child[$isTransparent]()) {
|
||||
yield* child[$getChildrenByNameIt](name, allTransparent, false);
|
||||
}
|
||||
}
|
||||
|
||||
if (first && this[_attributeNames].has(name)) {
|
||||
yield new XFAAttribute(this, name, this[name]);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
class XFAObjectArray {
|
||||
|
@ -398,10 +449,34 @@ class XFAObjectArray {
|
|||
clone[_children] = this[_children].map(c => c[_clone]());
|
||||
return clone;
|
||||
}
|
||||
|
||||
get children() {
|
||||
return this[_children];
|
||||
}
|
||||
}
|
||||
|
||||
class XFAAttribute {
|
||||
constructor(node, name, value) {
|
||||
this[_parent] = node;
|
||||
this[$nodeName] = name;
|
||||
this[$content] = value;
|
||||
}
|
||||
|
||||
[$getParent]() {
|
||||
return this[_parent];
|
||||
}
|
||||
|
||||
[$isDataValue]() {
|
||||
return true;
|
||||
}
|
||||
|
||||
[$text]() {
|
||||
return this[$content];
|
||||
}
|
||||
}
|
||||
|
||||
class XmlObject extends XFAObject {
|
||||
constructor(nsId, name, attributes = Object.create(null)) {
|
||||
constructor(nsId, name, attributes = null) {
|
||||
super(nsId, name);
|
||||
this[$content] = "";
|
||||
if (name !== "#text") {
|
||||
|
@ -412,6 +487,7 @@ class XmlObject extends XFAObject {
|
|||
[$onChild](child) {
|
||||
if (this[$content]) {
|
||||
const node = new XmlObject(this[$namespaceId], "#text");
|
||||
node[_parent] = this;
|
||||
node[$content] = this[$content];
|
||||
this[$content] = "";
|
||||
this[_children].push(node);
|
||||
|
@ -428,6 +504,7 @@ class XmlObject extends XFAObject {
|
|||
[$finalize]() {
|
||||
if (this[$content] && this[_children].length > 0) {
|
||||
const node = new XmlObject(this[$namespaceId], "#text");
|
||||
node[_parent] = this;
|
||||
node[$content] = this[$content];
|
||||
this[_children].push(node);
|
||||
delete this[$content];
|
||||
|
@ -440,6 +517,54 @@ class XmlObject extends XFAObject {
|
|||
}
|
||||
return this[_children].map(c => c[$text]()).join("");
|
||||
}
|
||||
|
||||
[$getChildren](name = null) {
|
||||
if (!name) {
|
||||
return this[_children];
|
||||
}
|
||||
|
||||
return this[_children].filter(c => c[$nodeName] === name);
|
||||
}
|
||||
|
||||
[$getChildrenByClass](name) {
|
||||
const value = this[_attributes][name];
|
||||
if (value !== undefined) {
|
||||
return value;
|
||||
}
|
||||
return this[$getChildren](name);
|
||||
}
|
||||
|
||||
*[$getChildrenByNameIt](name, allTransparent) {
|
||||
const value = this[_attributes][name];
|
||||
if (value !== undefined) {
|
||||
yield new XFAAttribute(this, name, value);
|
||||
}
|
||||
|
||||
for (const child of this[_children]) {
|
||||
if (child[$nodeName] === name) {
|
||||
yield child;
|
||||
}
|
||||
|
||||
if (allTransparent) {
|
||||
yield* child[$getChildrenByNameIt](name, allTransparent);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
*[$getAttributeIt](name) {
|
||||
const value = this[_attributes][name];
|
||||
if (value !== undefined) {
|
||||
yield new XFAAttribute(this, name, value);
|
||||
}
|
||||
|
||||
for (const child of this[_children]) {
|
||||
yield* child[$getAttributeIt](name);
|
||||
}
|
||||
}
|
||||
|
||||
[$isDataValue]() {
|
||||
return this[_children].length === 0;
|
||||
}
|
||||
}
|
||||
|
||||
class ContentObject extends XFAObject {
|
||||
|
@ -521,7 +646,13 @@ export {
|
|||
$content,
|
||||
$dump,
|
||||
$finalize,
|
||||
$getAttributeIt,
|
||||
$getChildren,
|
||||
$getChildrenByClass,
|
||||
$getChildrenByName,
|
||||
$getChildrenByNameIt,
|
||||
$getParent,
|
||||
$isDataValue,
|
||||
$isTransparent,
|
||||
$namespaceId,
|
||||
$nodeName,
|
||||
|
@ -538,6 +669,7 @@ export {
|
|||
Option10,
|
||||
OptionObject,
|
||||
StringObject,
|
||||
XFAAttribute,
|
||||
XFAObject,
|
||||
XFAObjectArray,
|
||||
XmlObject,
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue