/* Copyright 2012 Mozilla Foundation
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

import { warn } from '../shared/util';
// Character types for symbols from 0000 to 00FF.
// Source: ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.txt
// The table is indexed directly by char code, so it must keep exactly 256
// entries in code point order.
// prettier-ignore
const baseTypes = [
  'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'S', 'B', 'S',
  'WS', 'B', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN',
  'BN', 'BN', 'BN', 'BN', 'B', 'B', 'B', 'S', 'WS', 'ON', 'ON', 'ET',
  'ET', 'ET', 'ON', 'ON', 'ON', 'ON', 'ON', 'ES', 'CS', 'ES', 'CS', 'CS',
  'EN', 'EN', 'EN', 'EN', 'EN', 'EN', 'EN', 'EN', 'EN', 'EN', 'CS', 'ON',
  'ON', 'ON', 'ON', 'ON', 'ON', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L',
  'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L',
  'L', 'L', 'L', 'L', 'ON', 'ON', 'ON', 'ON', 'ON', 'ON', 'L', 'L', 'L',
  'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L',
  'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'ON', 'ON', 'ON', 'ON',
  'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'B', 'BN', 'BN', 'BN', 'BN', 'BN',
  'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN',
  'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'BN', 'CS', 'ON', 'ET',
  'ET', 'ET', 'ET', 'ON', 'ON', 'ON', 'ON', 'L', 'ON', 'ON', 'BN', 'ON',
  'ON', 'ET', 'ET', 'EN', 'EN', 'ON', 'L', 'ON', 'ON', 'ON', 'EN', 'L',
  'ON', 'ON', 'ON', 'ON', 'ON', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L',
  'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L',
  'L', 'ON', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L',
  'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L',
  'L', 'L', 'L', 'L', 'L', 'ON', 'L', 'L', 'L', 'L', 'L', 'L', 'L', 'L'
];

// Character types for symbols from 0600 to 06FF.
// Source: ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.txt
// Note that 061D does not exist in the Unicode standard (see
// http://unicode.org/charts/PDF/U0600.pdf), so we replace it with an
// empty string and issue a warning if we encounter this character. The
// empty string is required to properly index the items after it.
// The table is indexed by the low byte of the char code, so it must keep
// exactly 256 entries in code point order.
// prettier-ignore
const arabicTypes = [
  'AN', 'AN', 'AN', 'AN', 'AN', 'AN', 'ON', 'ON', 'AL', 'ET', 'ET', 'AL',
  'CS', 'AL', 'ON', 'ON', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM',
  'NSM', 'NSM', 'NSM', 'NSM', 'AL', 'AL', '', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM',
  'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM',
  'NSM', 'NSM', 'NSM', 'NSM', 'AN', 'AN', 'AN', 'AN', 'AN', 'AN', 'AN',
  'AN', 'AN', 'AN', 'ET', 'AN', 'AN', 'AL', 'AL', 'AL', 'NSM', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL',
  'AL', 'AL', 'AL', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'AN',
  'ON', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'NSM', 'AL', 'AL', 'NSM', 'NSM',
  'ON', 'NSM', 'NSM', 'NSM', 'NSM', 'AL', 'AL', 'EN', 'EN', 'EN', 'EN',
  'EN', 'EN', 'EN', 'EN', 'EN', 'EN', 'AL', 'AL', 'AL', 'AL', 'AL', 'AL'
];

/**
 * Tests whether the lowest bit of an integer is set.
 *
 * @param {number} i - The value to test (used here for embedding levels).
 * @returns {boolean} `true` when `i` is odd.
 */
function isOdd(i) {
  return (i & 1) !== 0;
}

/**
 * Tests whether the lowest bit of an integer is clear.
 *
 * @param {number} i - The value to test (used here for embedding levels).
 * @returns {boolean} `true` when `i` is even.
 */
function isEven(i) {
  return (i & 1) === 0;
}

/**
 * Scans `arr` forward from `start` and reports where the run of `value`
 * entries ends.
 *
 * @param {Array} arr - The array to scan.
 * @param {number} start - Index at which scanning begins.
 * @param {*} value - The value the run consists of (compared with `!==`).
 * @returns {number} Index of the first entry at or after `start` that differs
 *   from `value`; `arr.length` when every remaining entry matches; `start`
 *   itself when `start` is already at or past the end of the array.
 */
function findUnequal(arr, start, value) {
  const length = arr.length;
  let index = start;
  while (index < length && arr[index] === value) {
    ++index;
  }
  return index;
}

/**
 * Overwrites the entries of `arr` in the half-open range [start, end) with
 * `value`, modifying the array in place.
 *
 * A plain loop is used on purpose: it assigns every index below `end`, even
 * ones beyond the current length of the array.
 *
 * @param {Array} arr - The array to modify.
 * @param {number} start - First index to overwrite (inclusive).
 * @param {number} end - Index at which to stop (exclusive).
 * @param {*} value - The value to store.
 */
function setValues(arr, start, end, value) {
  for (let index = start; index < end; ++index) {
    arr[index] = value;
  }
}

/**
 * Reverses, in place, the entries of `arr` in the half-open range
 * [start, end).
 *
 * @param {Array} arr - The array to modify.
 * @param {number} start - First index of the range (inclusive).
 * @param {number} end - End of the range (exclusive).
 */
function reverseValues(arr, start, end) {
  let low = start;
  let high = end - 1;
  // Swap the outermost pair and walk inwards until the cursors meet.
  while (low < high) {
    const held = arr[low];
    arr[low] = arr[high];
    arr[high] = held;
    ++low;
    --high;
  }
}

/**
 * Builds the result object returned by `bidi()`.
 *
 * @param {string} str - The (possibly reordered) text.
 * @param {boolean} isLTR - Whether the text is left-to-right; only consulted
 *   when `vertical` is falsy.
 * @param {boolean} [vertical] - Whether the text is vertical; takes
 *   precedence over `isLTR`.
 * @returns {{str: string, dir: string}} The text together with its direction:
 *   'ttb' for vertical text, otherwise 'ltr' or 'rtl'.
 */
function createBidiText(str, isLTR, vertical) {
  let dir;
  if (vertical) {
    dir = 'ttb';
  } else if (isLTR) {
    dir = 'ltr';
  } else {
    dir = 'rtl';
  }
  return {
    str,
    dir,
  };
}

// These are used in bidi(), which is called frequently. We re-use them on
// each call to avoid unnecessary allocations.
// bidi() resizes both arrays to the input length before filling them, so
// their contents are only meaningful for the duration of a single call.
const chars = [];
const types = [];

/**
 * Reorders a single line of text from logical to visual order, using a
 * simplified version of the Unicode Bidirectional Algorithm (explicit
 * embeddings, line-level resets, combining-mark reordering and mirroring are
 * all skipped; see the step comments in the body).
 *
 * Only code units up to U+00FF, U+0590-U+05F4 and U+0600-U+08AC are
 * classified; everything else is treated as left-to-right ('L').
 *
 * @param {string} str - The text to process.
 * @param {number} [startLevel=-1] - Paragraph embedding level. `-1` asks for
 *   auto-detection: the text is treated as RTL when at least 30% of its
 *   characters are of type R, AL or AN. The default exists so that omitting
 *   the argument no longer produces NaN levels, which silently skipped all
 *   reordering.
 * @param {boolean} [vertical=false] - When truthy the text is returned
 *   untouched with direction 'ttb'.
 * @returns {{str: string, dir: string}} The reordered text and its direction
 *   ('ltr', 'rtl' or 'ttb'). '<' and '>' characters are dropped from the
 *   result whenever reordering took place.
 */
function bidi(str, startLevel = -1, vertical = false) {
  let isLTR = true;
  const strLength = str.length;
  if (strLength === 0 || vertical) {
    return createBidiText(str, isLTR, vertical);
  }

  // Get types and fill arrays
  chars.length = strLength;
  types.length = strLength;
  let numBidi = 0;

  let i, ii;
  for (i = 0; i < strLength; ++i) {
    chars[i] = str.charAt(i);

    const charCode = str.charCodeAt(i);
    let charType = 'L';
    if (charCode <= 0x00ff) {
      charType = baseTypes[charCode];
    } else if (0x0590 <= charCode && charCode <= 0x05f4) {
      charType = 'R';
    } else if (0x0600 <= charCode && charCode <= 0x06ff) {
      charType = arabicTypes[charCode & 0xff];
      if (!charType) {
        // The table holds an empty string for code points without a type.
        warn('Bidi: invalid Unicode character ' + charCode.toString(16));
      }
    } else if (0x0700 <= charCode && charCode <= 0x08AC) {
      charType = 'AL';
    }
    if (charType === 'R' || charType === 'AL' || charType === 'AN') {
      numBidi++;
    }
    types[i] = charType;
  }

  // Detect the bidi method
  // - If there are no rtl characters then no bidi needed
  // - If less than 30% chars are rtl then string is primarily ltr
  // - If more than 30% chars are rtl then string is primarily rtl
  if (numBidi === 0) {
    isLTR = true;
    return createBidiText(str, isLTR);
  }

  if (startLevel === -1) {
    if ((numBidi / strLength) < 0.3) {
      isLTR = true;
      startLevel = 0;
    } else {
      isLTR = false;
      startLevel = 1;
    }
  }

  const levels = [];
  for (i = 0; i < strLength; ++i) {
    levels[i] = startLevel;
  }

  /*
   X1-X10: skip most of this, since we are NOT doing the embeddings.
   */
  const e = (isOdd(startLevel) ? 'R' : 'L');
  const sor = e;
  const eor = sor;

  /*
   W1. Examine each non-spacing mark (NSM) in the level run, and change the
   type of the NSM to the type of the previous character. If the NSM is at the
   start of the level run, it will get the type of sor.
   */
  let lastType = sor;
  for (i = 0; i < strLength; ++i) {
    if (types[i] === 'NSM') {
      types[i] = lastType;
    } else {
      lastType = types[i];
    }
  }

  /*
   W2. Search backwards from each instance of a European number until the
   first strong type (R, L, AL, or sor) is found. If an AL is found, change
   the type of the European number to Arabic number.
   */
  lastType = sor;
  let t;
  for (i = 0; i < strLength; ++i) {
    t = types[i];
    if (t === 'EN') {
      types[i] = (lastType === 'AL') ? 'AN' : 'EN';
    } else if (t === 'R' || t === 'L' || t === 'AL') {
      lastType = t;
    }
  }

  /*
   W3. Change all ALs to R.
   */
  for (i = 0; i < strLength; ++i) {
    t = types[i];
    if (t === 'AL') {
      types[i] = 'R';
    }
  }

  /*
   W4. A single European separator between two European numbers changes to a
   European number. A single common separator between two numbers of the same
   type changes to that type:
   */
  for (i = 1; i < strLength - 1; ++i) {
    if (types[i] === 'ES' && types[i - 1] === 'EN' && types[i + 1] === 'EN') {
      types[i] = 'EN';
    }
    if (types[i] === 'CS' &&
        (types[i - 1] === 'EN' || types[i - 1] === 'AN') &&
        types[i + 1] === types[i - 1]) {
      types[i] = types[i - 1];
    }
  }

  /*
   W5. A sequence of European terminators adjacent to European numbers changes
   to all European numbers:
   */
  for (i = 0; i < strLength; ++i) {
    if (types[i] === 'EN') {
      // do before
      let j;
      for (j = i - 1; j >= 0; --j) {
        if (types[j] !== 'ET') {
          break;
        }
        types[j] = 'EN';
      }
      // do after
      for (j = i + 1; j < strLength; ++j) {
        if (types[j] !== 'ET') {
          break;
        }
        types[j] = 'EN';
      }
    }
  }

  /*
   W6. Otherwise, separators and terminators change to Other Neutral:
   */
  for (i = 0; i < strLength; ++i) {
    t = types[i];
    if (t === 'WS' || t === 'ES' || t === 'ET' || t === 'CS') {
      types[i] = 'ON';
    }
  }

  /*
   W7. Search backwards from each instance of a European number until the
   first strong type (R, L, or sor) is found. If an L is found, then change
   the type of the European number to L.
   */
  lastType = sor;
  for (i = 0; i < strLength; ++i) {
    t = types[i];
    if (t === 'EN') {
      types[i] = ((lastType === 'L') ? 'L' : 'EN');
    } else if (t === 'R' || t === 'L') {
      lastType = t;
    }
  }

  /*
   N1. A sequence of neutrals takes the direction of the surrounding strong
   text if the text on both sides has the same direction. European and Arabic
   numbers are treated as though they were R. Start-of-level-run (sor) and
   end-of-level-run (eor) are used at level run boundaries.
   */
  for (i = 0; i < strLength; ++i) {
    if (types[i] === 'ON') {
      const end = findUnequal(types, i + 1, 'ON');
      let before = sor;
      if (i > 0) {
        before = types[i - 1];
      }

      // NOTE(review): `end` is already the index of the first non-ON entry,
      // so `types[end + 1]` looks one position past the neighbour that N1
      // describes. Left untouched because existing output depends on it;
      // confirm against UAX #9 before changing.
      let after = eor;
      if (end + 1 < strLength) {
        after = types[end + 1];
      }
      if (before !== 'L') {
        before = 'R';
      }
      if (after !== 'L') {
        after = 'R';
      }
      if (before === after) {
        setValues(types, i, end, before);
      }
      i = end - 1; // reset to end (-1 so next iteration is ok)
    }
  }

  /*
   N2. Any remaining neutrals take the embedding direction.
   */
  for (i = 0; i < strLength; ++i) {
    if (types[i] === 'ON') {
      types[i] = e;
    }
  }

  /*
   I1. For all characters with an even (left-to-right) embedding direction,
   those of type R go up one level and those of type AN or EN go up two
   levels.
   I2. For all characters with an odd (right-to-left) embedding direction,
   those of type L, EN or AN go up one level.
   */
  for (i = 0; i < strLength; ++i) {
    t = types[i];
    if (isEven(levels[i])) {
      if (t === 'R') {
        levels[i] += 1;
      } else if (t === 'AN' || t === 'EN') {
        levels[i] += 2;
      }
    } else { // isOdd
      if (t === 'L' || t === 'AN' || t === 'EN') {
        levels[i] += 1;
      }
    }
  }

  /*
   L1. On each line, reset the embedding level of the following characters to
   the paragraph embedding level:

   segment separators,
   paragraph separators,
   any sequence of whitespace characters preceding a segment separator or
   paragraph separator, and any sequence of white space characters at the end
   of the line.
   */

  // don't bother as text is only single line

  /*
   L2. From the highest level found in the text to the lowest odd level on
   each line, reverse any contiguous sequence of characters that are at that
   level or higher.
   */

  // find highest level & lowest odd level
  let highestLevel = -1;
  let lowestOddLevel = 99;
  let level;
  for (i = 0, ii = levels.length; i < ii; ++i) {
    level = levels[i];
    if (highestLevel < level) {
      highestLevel = level;
    }
    if (lowestOddLevel > level && isOdd(level)) {
      lowestOddLevel = level;
    }
  }

  // now reverse between those limits
  for (level = highestLevel; level >= lowestOddLevel; --level) {
    // find segments to reverse
    let start = -1;
    for (i = 0, ii = levels.length; i < ii; ++i) {
      if (levels[i] < level) {
        if (start >= 0) {
          reverseValues(chars, start, i);
          start = -1;
        }
      } else if (start < 0) {
        start = i;
      }
    }
    // A run that reaches the end of the text is still open here.
    if (start >= 0) {
      reverseValues(chars, start, levels.length);
    }
  }

  /*
   L3. Combining marks applied to a right-to-left base character will at this
   point precede their base character. If the rendering engine expects them to
   follow the base characters in the final display process, then the ordering
   of the marks and the base character must be reversed.
   */

  // don't bother for now

  /*
   L4. A character that possesses the mirrored property as specified by
   Section 4.7, Mirrored, must be depicted by a mirrored glyph if the resolved
   directionality of that character is R.
   */

  // don't mirror as characters are already mirrored in the pdf

  // Finally, return string
  for (i = 0, ii = chars.length; i < ii; ++i) {
    const ch = chars[i];
    if (ch === '<' || ch === '>') {
      chars[i] = '';
    }
  }
  return createBidiText(chars.join(''), isLTR);
}

export {
  bidi,
};