pdf.js/PDFFont.js

1499 lines
45 KiB
JavaScript
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

/* -*- Mode: Java; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- /
/* vim: set shiftwidth=2 tabstop=2 autoindent cindent expandtab: */
var kMaxFontFileSize = 100000;
/**
* This dictionary holds decoded fonts data.
*/
var Fonts = new Dict();
/**
* This simple object keep a trace of the fonts that have already been decoded
* by storing a map between the name given by the PDF and the name gather from
* the font (aka the PostScript code of the font itself for Type1 font).
*/
var _Fonts = {};
var Stack = function() {
var innerStack = [];
this.push = function(aOperand) {
innerStack.push(aOperand);
};
this.pop = function() {
if (!this.count())
throw new Error("stackunderflow");
return innerStack.pop();
};
this.peek = function() {
if (!this.count())
return null;
return innerStack[innerStack.length - 1];
};
this.get = function(aIndex) {
return innerStack[aIndex];
};
this.clear = function() {
innerStack = [];
};
this.count = function() {
return innerStack.length;
};
this.dump = function() {
for (var i = 0; i < this.length; i++)
log(innerStack[i]);
};
this.clone = function() {
return innerStack.slice();
};
};
var Base64Encoder = {
encode: function(aFontName, aData) {
var str = [];
var count = aData.length;
for (var i = 0; i < count; i++)
str.push(aData.getChar ? aData.getChar() : String.fromCharCode(aData[i]));
// Add the css rule to the document
var fontData = window.btoa(str.join(""));
var url = "url(data:font/otf;base64," + fontData + ");";
document.styleSheets[0].insertRule("@font-face { font-family: '" + aFontName + "'; src: " + url + " }", 0);
return fontData;
}
};
var TrueTypeFont = function(aFontName, aFontFile) {
if (_Fonts[aFontName])
return;
_Fonts[aFontName] = true;
var debug = true;
function dump(aMsg) {
if (debug)
log(aMsg);
}
dump("Loading a TrueType font: " + aFontName);
var fontData = Base64Encoder.encode(aFontName, aFontFile);
Fonts.set(aFontName, fontData);
};
var Type1Parser = function(aAsciiStream, aBinaryStream) {
var lexer = aAsciiStream ? new Lexer(aAsciiStream) : null;
// Turn on this flag for additional debugging logs
var debug = false;
var dump = function(aData) {
if (debug)
log(aData);
};
// Hold the fontName as declared inside the /FontName postscript directive
// XXX This is a hack but at the moment I need it to map the name declared
// in the PDF and the name in the PS code.
var fontName = "";
/*
* Parse a whole Type1 font stream (from the first segment to the last)
* assuming the 'eexec' block is binary data and fill up the 'Fonts'
* dictionary with the font informations.
*/
var self = this;
this.parse = function() {
if (!debug) {
while (!processNextToken()) {};
return fontName;
} else {
// debug mode is used to debug postcript processing
setTimeout(function() {
if (!processNextToken())
self.parse();
}, 0);
}
};
/*
* Decrypt a Sequence of Ciphertext Bytes to Produce the Original Sequence
* of Plaintext Bytes. The function took a key as a parameter which can be
* for decrypting the eexec block of for decoding charStrings.
*/
var kEexecEncryptionKey = 55665;
var kCharStringsEncryptionKey = 4330;
function decrypt(aStream, aKey, aDiscardNumber) {
var start = Date.now();
var r = aKey, c1 = 52845, c2 = 22719;
var decryptedString = [];
var value = "";
var count = aStream.length;
for (var i = 0; i < count; i++) {
value = aStream.getByte();
decryptedString[i] = String.fromCharCode(value ^ (r >> 8));
r = ((value + r) * c1 + c2) & ((1 << 16) - 1);
}
var end = Date.now();
dump("Time to decrypt string of length " + count + " is " + (end - start));
return decryptedString.slice(aDiscardNumber);
};
/*
* CharStrings are encoded following the the CharString Encoding sequence
* describe in Chapter 6 of the "Adobe Type1 Font Format" specification.
* The value in a byte indicates a command, a number, or subsequent bytes
* that are to be interpreted in a special way.
*
* CharString Number Encoding:
* A CharString byte containing the values from 32 through 255 inclusive
* indicate an integer. These values are decoded in four ranges.
*
* 1. A CharString byte containing a value, v, between 32 and 246 inclusive,
* indicate the integer v - 139. Thus, the integer values from -107 through
* 107 inclusive may be encoded in single byte.
*
* 2. A CharString byte containing a value, v, between 247 and 250 inclusive,
* indicates an integer involving the next byte, w, according to the formula:
* [(v - 247) x 256] + w + 108
*
* 3. A CharString byte containing a value, v, between 251 and 254 inclusive,
* indicates an integer involving the next byte, w, according to the formula:
* -[(v - 251) * 256] - w - 108
*
* 4. A CharString containing the value 255 indicates that the next 4 bytes
* are a two complement signed integer. The first of these bytes contains the
* highest order bits, the second byte contains the next higher order bits
* and the fourth byte contain the lowest order bits.
*
*
* CharString Command Encoding:
* CharStrings commands are encoded in 1 or 2 bytes.
*
* Single byte commands are encoded in 1 byte that contains a value between
* 0 and 31 inclusive.
* If a command byte contains the value 12, then the value in the next byte
* indicates a command. This "escape" mechanism allows many extra commands
* to be encoded and this encoding technique helps to minimize the length of
* the charStrings.
*/
var charStringDictionary = {
"1": "hstem",
"3": "vstem",
"4": "vmoveto",
"5": "rlineto",
"6": "hlineto",
"7": "vlineto",
"8": "rrcurveto",
"9": "closepath",
"10": "callsubr",
"11": "return",
"12": {
"0": "dotsection",
"1": "vstem3",
"3": "hstem3",
"6": "seac",
"7": "sbw",
"12": "div",
"16": "callothersubr",
"17": "pop",
"33": "setcurrentpoint"
},
"13": "hsbw",
"14": "endchar",
"21": "rmoveto",
"22": "hmoveto",
"30": "vhcurveto",
"31": "hvcurveto"
};
function decodeCharString(aStream) {
var start = Date.now();
var charString = [];
var value = "";
var count = aStream.length;
for (var i = 0; i < count; i++) {
value = aStream.getByte();
if (value < 32) {
if (value == 12) {
value = charStringDictionary["12"][aStream.getByte()];
i++;
} else {
value = charStringDictionary[value];
}
} else if (value <= 246) {
value = parseInt(value) - 139;
} else if (value <= 250) {
value = ((value - 247) * 256) + parseInt(aStream.getByte()) + 108;
i++;
} else if (value <= 254) {
value = -((value - 251) * 256) - parseInt(aStream.getByte()) - 108;
i++;
} else {
var byte = aStream.getByte();
var high = (byte >> 1);
value = (byte - high) << 24 | aStream.getByte() << 16 |
aStream.getByte() << 8 | aStream.getByte();
i += 4;
}
charString.push(value);
}
var end = Date.now();
dump("Time to decode charString of length " + count + " is " + (end - start));
return charString;
}
/*
* The operand stack holds arbitrary PostScript objects that are the operands
* and results of PostScript operators being executed. The interpreter pushes
* objects on the operand stack when it encounters them as literal data in a
* program being executed. When an operator requires one or more operands, it
* obtains them by popping them off the top of the operand stack. When an
* operator returns one or more results, it does so by pushing them on the
* operand stack.
*/
var operandStack = new Stack();
// Flag indicating if the topmost operand of the operandStack is an array
var operandIsArray = 0;
/*
* The dictionary stack holds only dictionary objects. The current set of
* dictionaries on the dictionary stack defines the environment for all
* implicit name searches, such as those that occur when the interpreter
* encounters an executable name. The role of the dictionary stack is
* introduced in Section 3.3, “Data Types and Objects,” and is further
* explained in Section 3.5, “Execution.” of the PostScript Language
* Reference.
*/
var systemDict = new Dict(),
globalDict = new Dict(),
userDict = new Dict();
var dictionaryStack = new Stack();
dictionaryStack.push(systemDict);
dictionaryStack.push(globalDict);
dictionaryStack.push(userDict);
/*
* The execution stack holds executable objects (mainly procedures and files)
* that are in intermediate stages of execution. At any point in the
* execution of a PostScript program, this stack represents the programs
* call stack. Whenever the interpreter suspends execution of an object to
* execute some other object, it pushes the new object on the execution
* stack. When the interpreter finishes executing an object, it pops that
* object off the execution stack and resumes executing the suspended object
* beneath it.
*/
var executionStack = new Stack();
/*
* Return the next token in the execution stack
*/
function nextInStack() {
var currentProcedure = executionStack.peek();
if (currentProcedure) {
var command = currentProcedure.shift();
if (!currentProcedure.length)
executionStack.pop();
return command;
}
return lexer.getObj();
};
/*
* Get the next token from the executionStack and process it.
* Actually the function does not process the third segment of a Type1 font
* and end on 'closefile'.
*
* The method thrown an error if it encounters an unknown token.
*/
function processNextToken() {
var obj = nextInStack();
if (operandIsArray && !IsCmd(obj, "{") && !IsCmd(obj, "[") &&
!IsCmd(obj, "]") && !IsCmd(obj, "}")) {
dump("Adding an object: " + obj +" to array " + operandIsArray);
var currentArray = operandStack.peek();
for (var i = 1; i < operandIsArray; i++)
currentArray = currentArray[currentArray.length - 1];
currentArray.push(obj);
} else if (IsBool(obj) || IsInt(obj) || IsNum(obj) || IsString(obj)) {
dump("Value: " + obj);
operandStack.push(obj);
} else if (IsName(obj)) {
dump("Name: " + obj.name);
operandStack.push(obj.name);
} else if (IsCmd(obj)) {
var command = obj.cmd;
dump(command);
switch (command) {
case "[":
case "{":
dump("Start" + (command == "{" ? " Executable " : " ") + "Array");
operandIsArray++;
var currentArray = operandStack;
for (var i = 1; i < operandIsArray; i++)
if (currentArray.peek)
currentArray = currentArray.peek();
else
currentArray = currentArray[currentArray.length - 1];
currentArray.push([]);
break;
case "]":
case "}":
var currentArray = operandStack.peek();
for (var i = 1; i < operandIsArray; i++)
currentArray = currentArray[currentArray.length - 1];
dump("End" + (command == "}" ? " Executable " : " ") + "Array: " + currentArray.join(" "));
operandIsArray--;
break;
case "if":
var procedure = operandStack.pop();
var bool = operandStack.pop();
if (!IsBool(bool)) {
dump("if: " + bool);
// we need to execute things, let be dirty
executionStack.push(bool);
} else {
dump("if ( " + bool + " ) { " + procedure + " }");
if (bool)
executionStack.push(procedure);
}
break;
case "ifelse":
var procedure1 = operandStack.pop();
var procedure2 = operandStack.pop();
var bool = !!operandStack.pop();
dump("if ( " + bool + " ) { " + procedure2 + " } else { " + procedure1 + " }");
executionStack.push(bool ? procedure2 : procedure1);
break;
case "for":
var procedure = operandStack.pop();
var limit = operandStack.pop();
var increment = operandStack.pop();
var initial = operandStack.pop();
for (var i = 0; i < limit; i += increment) {
operandStack.push(i);
executionStack.push(procedure.slice());
}
break;
case "dup":
dump("duplicate: " + operandStack.peek());
operandStack.push(operandStack.peek());
break;
case "mark":
operandStack.push("mark");
break;
case "cleartomark":
var command = "";
do {
command = operandStack.pop();
} while (command != "mark");
break;
case "put":
var data = operandStack.pop();
var indexOrKey = operandStack.pop();
var object = operandStack.pop();
dump("put " + data + " in " + object + "[" + indexOrKey + "]");
object.set ? object.set(indexOrKey, data)
: object[indexOrKey] = data;
break;
case "pop":
operandStack.pop();
break;
case "exch":
var operand1 = operandStack.pop();
var operand2 = operandStack.pop();
operandStack.push(operand1);
operandStack.push(operand2);
break;
case "get":
var indexOrKey = operandStack.pop();
var object = operandStack.pop();
var data = object.get ? object.get(indexOrKey) : object[indexOrKey];
dump("get " + object + "[" + indexOrKey + "]: " + data);
operandStack.push(data);
break;
case "currentdict":
var dict = dictionaryStack.peek();
operandStack.push(dict);
break;
case "systemdict":
operandStack.push(systemDict);
break;
case "readonly":
case "executeonly":
case "noaccess":
// Do nothing for the moment
break;
case "currentfile":
operandStack.push("currentfile");
break;
case "array":
var size = operandStack.pop();
var array = new Array(size);
operandStack.push(array);
break;
case "dict":
var size = operandStack.pop();
var dict = new Dict(size);
operandStack.push(dict);
break;
case "begin":
dictionaryStack.push(operandStack.pop());
break;
case "end":
dictionaryStack.pop();
break;
case "def":
var value = operandStack.pop();
var key = operandStack.pop();
// XXX we don't want to do that here but for some reasons the names
// are different between what is declared and the FontName directive
if (key == "FontName" && Fonts.get(value)) {
// The font has already be decoded, stop!
return true;
}
dump("def: " + key + " = " + value);
dictionaryStack.peek().set(key, value);
break;
case "definefont":
var font = operandStack.pop();
var key = operandStack.pop();
dump("definefont " + font + " with key: " + key);
// The key will be the identifier to recognize this font
fontName = key;
Fonts.set(key, font);
operandStack.push(font);
break;
case "known":
var name = operandStack.pop();
var dict = operandStack.pop();
var data = !!dict.get(name);
dump("known: " + data + " :: " + name + " in dict: " + dict);
operandStack.push(data);
break;
case "exec":
executionStack.push(operandStack.pop());
break;
case "eexec":
// All the first segment data has been read, decrypt the second segment
// and start interpreting it in order to decode it
var file = operandStack.pop();
var eexecString = decrypt(aBinaryStream, kEexecEncryptionKey, 4).join("");
dump(eexecString);
lexer = new Lexer(new StringStream(eexecString));
break;
case "LenIV":
error("LenIV: argh! we need to modify the length of discard characters for charStrings");
break;
case "closefile":
var file = operandStack.pop();
return true;
break;
case "index":
var operands = [];
var size = operandStack.pop();
for (var i = 0; i < size; i++)
operands.push(operandStack.pop());
var newOperand = operandStack.peek();
while (operands.length)
operandStack.push(operands.pop());
operandStack.push(newOperand);
break;
case "string":
var size = operandStack.pop();
var str = (new Array(size + 1)).join(" ");
operandStack.push(str);
break;
case "readstring":
var str = operandStack.pop();
var size = str.length;
var file = operandStack.pop();
// Add '1' because of the space separator, this is dirty
var stream = lexer.stream.makeSubStream(lexer.stream.pos + 1, size);
lexer.stream.skip(size + 1);
var charString = decrypt(stream, kCharStringsEncryptionKey, 4).join("");
var charStream = new StringStream(charString);
var decodedCharString = decodeCharString(charStream);
dump("decodedCharString: " + decodedCharString);
operandStack.push(decodedCharString);
// boolean indicating if the operation is a success or not
operandStack.push(true);
break;
case "StandardEncoding":
// For some reason the value is considered as a command, maybe it is
// because of the uppercase 'S'
operandStack.push(obj.cmd);
break;
default:
var command = null;
if (IsCmd(obj)) {
for (var i = 0; i < dictionaryStack.count(); i++) {
if (command = dictionaryStack.get(i).get(obj.cmd)) {
dump("found in dictionnary for " + obj.cmd + " command: " + command);
executionStack.push(command.slice());
break;
}
}
}
if (!command) {
log("operandStack: " + operandStack);
log("dictionaryStack: " + dictionaryStack);
log(obj);
error("Unknow command while parsing font");
}
break;
}
} else if (obj) {
dump("unknow: " + obj);
operandStack.push(obj);
} else { // The End!
operandStack.dump();
return true;
}
return false;
}
/*
* Flatten the commands by interpreting the postscript code and replacing
* every 'callsubr', 'callothersubr' by the real commands.
* At the moment OtherSubrs are not fully supported and only otherSubrs 0-4
* as descrived in 'Using Subroutines' of 'Adobe Type 1 Font Format',
* chapter 8.
*/
this.flattenCharstring = function(aCharstring, aDefaultWidth, aSubrs) {
operandStack.clear();
executionStack.clear();
executionStack.push(aCharstring);
var leftSidebearing = 0;
var lastPoint = 0;
while (true) {
var obj = nextInStack();
if (IsBool(obj) || IsInt(obj) || IsNum(obj)) {
dump("Value: " + obj);
operandStack.push(obj);
} else if (IsString(obj)) {
dump("String: " + obj);
switch (obj) {
case "hsbw":
var charWidthVector = operandStack.pop();
leftSidebearing = operandStack.pop();
if (charWidthVector != aDefaultWidth)
operandStack.push(charWidthVector - aDefaultWidth);
break;
case "rmoveto":
var dy = operandStack.pop();
var dx = operandStack.pop();
if (leftSidebearing) {
dx += leftSidebearing;
leftSidebearing = 0;
}
operandStack.push(dx);
operandStack.push(dy);
operandStack.push("rmoveto");
break;
case "div":
var num2 = operandStack.pop();
var num1 = operandStack.pop();
operandStack.push(num2 / num1);
break;
case "setcurrentpoint":
case "dotsection":
case "seac":
case "sbw":
error(obj + " parsing is not implemented (yet)");
break;
case "closepath":
case "return":
break;
case "vstem3":
case "vstem":
operandStack.push("vstem");
break;
case "hstem":
case "hstem3":
operandStack.push("hstem");
break;
case "callsubr":
var index = operandStack.pop();
executionStack.push(aSubrs[index].slice());
break;
case "callothersubr":
// XXX need to be improved
var index = operandStack.pop();
var count = operandStack.pop();
var data = operandStack.pop();
if (index != 3)
dump("callothersubr for index: " + index);
operandStack.push(3);
operandStack.push("callothersubr");
break;
case "endchar":
operandStack.push("endchar");
return operandStack.clone();
case "pop":
operandStack.pop();
break;
default:
operandStack.push(obj);
break;
}
}
}
}
};
var type1hack = false;
var Type1Font = function(aFontName, aFontFile) {
if (_Fonts[aFontName])
return;
_Fonts[aFontName] = true;
// All Type1 font program should begin with the comment %!
if (aFontFile.getByte() != 0x25 || aFontFile.getByte() != 0x21)
error("Invalid file header");
if (!type1hack || true) {
type1hack = true;
var start = Date.now();
var ASCIIStream = aFontFile.makeSubStream(0, aFontFile.dict.get("Length1"), aFontFile.dict);
var binaryStream = aFontFile.makeSubStream(aFontFile.dict.get("Length1"), aFontFile.dict.get("Length2"), aFontFile.dict);
this.parser = new Type1Parser(ASCIIStream, binaryStream);
var fontName = this.parser.parse();
var font = Fonts.get(fontName);
var fontData = this.convertToOTF(this.convertToCFF(font), font);
fontData = Base64Encoder.encode(aFontName, fontData);
Fonts.set(aFontName, fontData);
var end = Date.now();
log("Time to parse font is:" + (end - start));
}
};
Type1Font.prototype = {
getDefaultWidth: function(aCharstrings) {
var defaultWidth = 0;
var defaultUsedCount = 0;
var widths = {};
for (var i = 0; i < aCharstrings.length; i++) {
var width = aCharstrings[i].charstring[1];
var usedCount = (widths[width] || 0) + 1;
if (usedCount > defaultUsedCount) {
defaultUsedCount = usedCount;
defaultWidth = width;
}
widths[width] = usedCount;
}
return parseInt(defaultWidth);
},
createCFFIndexHeader: function(aObjects, aIsByte) {
var data = [];
// First 2 bytes contains the number of objects contained into this index
var count = aObjects.length;
if (count ==0)
return [0x00, 0x00, 0x00];
var bytes = this.integerToBytes(count, 2);
for (var i = 0; i < bytes.length; i++)
data.push(bytes[i]);
// Next byte contains the offset size use to reference object in the file
// Actually we're using 0x04 to be sure to be able to store everything
// without thinking of it while coding.
data.push(0x04);
// Add another offset after this one because we need a new offset
var relativeOffset = 1;
for (var i = 0; i < count + 1; i++) {
var bytes = this.integerToBytes(relativeOffset, 4);
for (var j = 0; j < bytes.length; j++)
data.push(bytes[j]);
if (aObjects[i])
relativeOffset += aObjects[i].length;
}
for (var i =0; i < count; i++) {
for (var j = 0; j < aObjects[i].length; j++)
data.push(aIsByte ? aObjects[i][j] : aObjects[i].charCodeAt(j));
}
return data;
},
integerToBytes: function(aValue, aBytesCount) {
var bytes = [];
for (var i = 0; i < aBytesCount; i++)
bytes[i] = 0x00;
do {
bytes[--aBytesCount] = (aValue & 0xFF);
aValue = aValue >> 8;
} while (aBytesCount && aValue > 0);
return bytes;
},
bytesToInteger: function(aBytesArray) {
var value = 0;
for (var i = 0; i < aBytesArray.length; i++)
value = (value << 8) + aBytesArray[i];
return value;
},
encodeNumber: function(aValue) {
var x = 0;
// XXX we don't really care about Type2 optimization here...
if (aValue >= -32768 && aValue <= 32767) {
return [
28,
this.integerToBytes(aValue >> 8, 1),
this.integerToBytes(aValue, 1)
];
} else if (aValue >= (-2147483647-1) && aValue <= 2147483647) {
return [
0xFF,
this.integerToBytes(aValue >> 24, 1),
this.integerToBytes(aValue >> 16, 1),
this.integerToBytes(aValue >> 8, 1),
this.integerToBytes(aValue, 1)
];
} else {
error("Value: " + aValue + " is not allowed");
}
},
getOrderedCharStrings: function(aFont) {
var dict = aFont.get("CharStrings")
var charstrings = [];
for (var glyph in dict.map) {
charstrings.push({
glyph: glyph,
charstring: dict.map[glyph].slice()
});
}
charstrings.sort(function(a, b) {
return CFFStrings.indexOf(a.glyph) > CFFStrings.indexOf(b.glyph);
});
charstrings.shift();
return charstrings;
},
convertToCFF: function(aFont) {
var debug = false;
function dump(aMsg) {
if (debug)
log(aMsg);
};
var charstrings = this.getOrderedCharStrings(aFont);
var defaultWidth = this.getDefaultWidth(charstrings);
var charstringsCount = 0;
var charstringsDataLength = 0;
var glyphs = [];
var glyphsChecker = {};
var subrs = aFont.get("Private").get("Subrs");
var parser = new Type1Parser();
for (var i = 0; i < charstrings.length; i++) {
var charstring = charstrings[i].charstring.slice();
var glyph = charstrings[i].glyph;
if (glyphsChecker[glyph])
error("glyphs already exists!");
glyphsChecker[glyph] = true;
var flattened = parser.flattenCharstring(charstring, defaultWidth, subrs);
glyphs.push(flattened);
charstringsCount++;
charstringsDataLength += flattened.length;
}
dump("There is " + charstringsCount + " glyphs (size: " + charstringsDataLength + ")");
// Create a CFF font data
var cff = new Uint8Array(kMaxFontFileSize);
var currentOffset = 0;
// Font header (major version, minor version, header size, offset size)
var header = [0x01, 0x00, 0x04, 0x04];
currentOffset += header.length;
cff.set(header);
// Names Index
var nameIndex = this.createCFFIndexHeader([aFont.get("FontName")]);
cff.set(nameIndex, currentOffset);
currentOffset += nameIndex.length;
// Calculate strings before writing the TopDICT index in order
// to calculate correct relative offsets for storing 'charset'
// and 'charstrings' data
var fontInfo = aFont.get("FontInfo");
var version = fontInfo.get("version");
var notice = fontInfo.get("Notice");
var fullName = fontInfo.get("FullName");
var familyName = fontInfo.get("FamilyName");
var weight = fontInfo.get("Weight");
var strings = [version, notice, fullName,
familyName, weight];
var stringsIndex = this.createCFFIndexHeader(strings);
var stringsDataLength = stringsIndex.length;
// Create the global subroutines index
var globalSubrsIndex = this.createCFFIndexHeader([]);
// Fill the charset header (first byte is the encoding)
var charset = [0x00];
for (var i = 0; i < glyphs.length; i++) {
var index = CFFStrings.indexOf(charstrings[i].glyph);
var bytes = this.integerToBytes(index, 2);
charset.push(bytes[0]);
charset.push(bytes[1]);
}
// Convert charstrings
var getNumFor = {
"hstem": 1,
"vstem": 3,
"vmoveto": 4,
"rlineto": 5,
"hlineto": 6,
"vlineto": 7,
"rrcurveto": 8,
"endchar": 14,
"rmoveto": 21,
"hmoveto": 22,
"vhcurveto": 30,
"hvcurveto": 31,
};
// Encode the glyph and add it to the FUX
var r = [[0x40, 0x0E]];
for (var i = 0; i < glyphs.length; i++) {
var data = glyphs[i].slice();
var charstring = [];
for (var j = 0; j < data.length; j++) {
var c = data[j];
if (!IsNum(c)) {
var token = getNumFor[c];
if (!token)
error(c);
charstring.push(token);
} else {
try {
var bytes = this.encodeNumber(c);
} catch(e) {
log("Glyph " + i + " has a wrong value: " + c + " in charstring: " + data);
log("the default value is glyph " + charstrings[i].glyph + " and is supposed to be: " + charstrings[i].charstring);
}
for (var k = 0; k < bytes.length; k++)
charstring.push(bytes[k]);
}
}
r.push(charstring);
}
var charstringsIndex = this.createCFFIndexHeader(r, true);
charstringsIndex = charstringsIndex.join(" ").split(" "); // XXX why?
var fontBBox = aFont.get("FontBBox");
//Top Dict Index
var topDictIndex = [
0x00, 0x01, 0x01, 0x01, 0x30,
248, 27, 0, // version
248, 28, 1, // Notice
248, 29, 2, // FullName
248, 30, 3, // FamilyName
248, 31, 4, // Weight
];
for (var i = 0; i < fontBBox.length; i++)
topDictIndex = topDictIndex.concat(this.encodeNumber(fontBBox[i]));
topDictIndex.push(5) // FontBBox;
var charsetOffset = currentOffset +
(topDictIndex.length + (4 + 4 + 4 + 7)) +
stringsIndex.length +
globalSubrsIndex.length;
topDictIndex = topDictIndex.concat(this.encodeNumber(charsetOffset));
topDictIndex.push(15); // charset
topDictIndex = topDictIndex.concat([28, 0, 0, 16]) // Encoding
var charstringsOffset = charsetOffset + (charstringsCount * 2) + 1;
topDictIndex = topDictIndex.concat(this.encodeNumber(charstringsOffset));
topDictIndex.push(17); // charstrings
topDictIndex = topDictIndex.concat([28, 0, 55])
var privateOffset = charstringsOffset + charstringsIndex.length;
topDictIndex = topDictIndex.concat(this.encodeNumber(privateOffset));
topDictIndex.push(18); // Private
topDictIndex = topDictIndex.join(" ").split(" ");
// Top Dict Index
cff.set(topDictIndex, currentOffset);
currentOffset += topDictIndex.length;
// Strings Index
cff.set(stringsIndex, currentOffset);
currentOffset += stringsIndex.length;
// Global Subrs Index
cff.set(globalSubrsIndex, currentOffset);
currentOffset += globalSubrsIndex.length;
// Charset Index
cff.set(charset, currentOffset);
currentOffset += charset.length;
// Fill charstrings data
cff.set(charstringsIndex, currentOffset);
currentOffset += charstringsIndex.length;
// Private Data
var privateData = [
248, 136, 20,
248, 136, 21,
119, 159, 248, 97, 159, 247, 87, 159, 6,
30, 10, 3, 150, 37, 255, 12, 9,
139, 12, 10,
172, 10,
172, 150, 143, 146, 150, 146, 12, 12,
247, 32, 11,
247, 10, 161, 147, 154, 150, 143, 12, 13,
139, 12, 14,
28, 0, 55, 19
];
cff.set(privateData, currentOffset);
currentOffset += privateData.length;
// Dump shit at the end of the file
var shit = [
0x00, 0x01, 0x01, 0x01,
0x13, 0x5D, 0x65, 0x64,
0x5E, 0x5B, 0xAF, 0x66,
0xBA, 0xBB, 0xB1, 0xB0,
0xB9, 0xBA, 0x65, 0xB2,
0x5C, 0x1F, 0x0B
];
cff.set(shit, currentOffset);
currentOffset += shit.length;
dump("==================== debug ====================");
//var file = new Uint8Array(cff, 0, currentOffset);
//var parser = new Type2Parser();
//parser.parse(new Stream(file));
var data = [];
for (var i = 0; i < currentOffset; i++)
data.push(cff[i]);
//log("== write to file");
//writeToFile(data, "/tmp/pdf.js.cff");
return data;
},
getMaxPower2: function(aNumber) {
var maxPower = 0;
var value = aNumber;
while (value >= 2) {
value /= 2;
maxPower++;
}
value = 2;
for (var i = 1; i < maxPower; i++)
value *= 2;
return value;
},
createOpenTypeHeader: function(aNumTables) {
// sfnt version (4 bytes)
var version = [0x4F, 0x54, 0x54, 0X4F];
// numTables (2 bytes)
var numTables = aNumTables;
// searchRange (2 bytes)
var searchRange = this.getMaxPower2(numTables) * 16;
// entrySelector (2 bytes)
var entrySelector = Math.log(this.getMaxPower2(numTables)) / Math.log(2);
// rangeShift (2 bytes)
var rangeShift = numTables * 16 - searchRange;
return [].concat(version,
this.integerToBytes(numTables, 2),
this.integerToBytes(searchRange, 2),
this.integerToBytes(entrySelector, 2),
this.integerToBytes(rangeShift, 2));
},
createTableEntry: function(aTag, aOffset, aData) {
// tag
var tag = [
aTag.charCodeAt(0),
aTag.charCodeAt(1),
aTag.charCodeAt(2),
aTag.charCodeAt(3)
];
// offset
var offset = aOffset;
// length
// Per spec tables must be 4-bytes align so add some 0x00 if needed
while (aData.length & 3)
aData.push(0x00);
var length = aData.length;
// checksum
var checksum = this.bytesToInteger(tag) + offset + length;
return [].concat(tag,
this.integerToBytes(checksum, 4),
this.integerToBytes(offset, 4),
this.integerToBytes(length, 4));
},
convertToOTF: function(aData, aFont) {
var otf = new Uint8Array(kMaxFontFileSize);
var currentOffset = 0;
var numTables = 9;
var header = this.createOpenTypeHeader(numTables);
otf.set(header, currentOffset);
currentOffset += header.length;
var baseOffset = numTables * (4 * 4) + currentOffset;
var virtualOffset = baseOffset;
var tableEntry = this.createTableEntry("CFF ", virtualOffset, aData);
otf.set(tableEntry, currentOffset);
currentOffset += tableEntry.length;
virtualOffset += aData.length;
var OS2 = [
0x00, 0x03, // version
0x02, 0x24, // xAvgCharWidth
0x01, 0xF4, // usWeightClass
0x00, 0x05, // usWidthClass
0x00, 0x00, // fstype
0x02, 0x8A, // ySubscriptXSize
0x02, 0xBB, // ySubscriptYSize
0x00, 0x00, // ySubscriptXOffset
0x00, 0x8C, // ySubscriptYOffset
0x02, 0x8A, // ySuperScriptXSize
0x02, 0xBB, // ySuperScriptYSize
0x00, 0x00, // ySuperScriptXOffset
0x01, 0xDF, // ySuperScriptYOffset
0x00, 0x31, // yStrikeOutSize
0x01, 0x02, // yStrikeOutPosition
0x00, 0x00, // sFamilyClass
0x02, 0x00, 0x06, 0x03, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, // Panose
0x00, 0x00, 0x00, 0x01, // ulUnicodeRange1 (Bits 0-31)
0x00, 0x00, 0x00, 0x00, // ulUnicodeRange2 (Bits 32-63)
0x00, 0x00, 0x00, 0x00, // ulUnicodeRange3 (Bits 64-95)
0x00, 0x00, 0x00, 0x00, // ulUnicodeRange4 (Bits 96-127)
0x47, 0x49, 0x60, 0x20, // achVendID
0x00, 0x20, // fsSelection
0x00, 0x2D, // usFirstCharIndex
0x00, 0x7A, // usLastCharIndex
0x00, 0x03, // sTypoAscender
0x00, 0x20, // sTypeDescender
0x00, 0x38, // sTypoLineGap
0x00, 0x5A, // usWinAscent
0x02, 0xB4, // usWinDescent
0x00, 0xCE, 0x00, 0x00, // ulCodePageRange1 (Bits 0-31)
0x00, 0x01, 0x00, 0x00, // ulCodePageRange2 (Bits 32-63)
0x00, 0x00, // sxHeight
0x00, 0x00, // sCapHeight
0x00, 0x01, // usDefaultChar
0x00, 0xCD, // usBreakChar
0x00, 0x02 // usMaxContext
];
var tableEntry = this.createTableEntry("OS/2", virtualOffset, OS2);
otf.set(tableEntry, currentOffset);
currentOffset += tableEntry.length;
virtualOffset += OS2.length;
/** CMAP */
var charstrings = this.getOrderedCharStrings(aFont);
if (false) {
var cmap = [
0x00, 0x00, // version
0x00, 0x01, // numTables
0x00, 0x01, // platformID
0x00, 0x00, // encodingID
0x00, 0x00, 0x00, 0x0C, //offset
0x00, 0x00,
0x01, 0x06,
0x00, 0x00
];
var data = [];
for (var i = 0; i < 262; i++) {
data.push(0x00);
}
for (var i = 0; i < charstrings.length; i++) {
var glyph = charstrings[i].glyph;
if (glyph == ".notdef")
continue;
var pos = GlyphsUnicode[glyph];
if (!pos)
error(charstrings[i].glyph + " does not have an entry in the glyphs table");
var b1 = parseInt("0x" + pos[0] + pos[1]);
var b2 = parseInt("0x" + pos[2] + pos[3]);
var num = this.bytesToInteger([b1, b2]);
data[num] = i + 1;
}
cmap = cmap.concat(data);
}
else {
var data = new Array(1000);
for (var i = 0; i < charstrings.length; i++) {
var glyph = charstrings[i].glyph;
if (glyph == ".notdef")
continue;
var pos = GlyphsUnicode[glyph];
if (!pos)
error(charstrings[i].glyph + " does not have an entry in the glyphs table");
var b1 = parseInt("0x" + pos[0] + pos[1]);
var b2 = parseInt("0x" + pos[2] + pos[3]);
var num = this.bytesToInteger([b1, b2]);
data[num] = i + 1;
}
var ranges = [];
var range = [];
for (var i = 0; i < data.length; i++) {
var char = data[i];
if (char) {
range.push(i);
} else if (range.length) {
//log("create a new range of " + range.length + " chars width min: " + range[0] + " to max: " + range[range.length - 1]);
ranges.push(range.slice());
range = [];
}
}
var cmap = [];
var segCount = ranges.length + 1;
var segCount2 = segCount * 2;
var searchRange = this.getMaxPower2(segCount) * 2;
var searchEntry = Math.log(segCount) / Math.log(2);
var rangeShift = 2 * segCount - searchRange;
cmap = cmap.concat(this.integerToBytes(segCount2, 2));
cmap = cmap.concat(this.integerToBytes(searchRange, 2));
cmap = cmap.concat(this.integerToBytes(searchEntry, 2));
cmap = cmap.concat(this.integerToBytes(rangeShift, 2));
// End characters code with an additional 0xFFFF to finish the array
var endCodes = [];
for (var i = 0; i < ranges.length; i++) {
var range = ranges[i];
cmap = cmap.concat(this.integerToBytes(range[range.length - 1], 2));
};
cmap = cmap.concat([0xFF, 0xFF]);
// reserved pad
cmap = cmap.concat([0x00, 0x00]);
// Start characters code with an additional 0xFFFF to finish the array
for (var i = 0; i < ranges.length; i++) {
var range = ranges[i];
cmap = cmap.concat(this.integerToBytes(range[0], 2));
};
cmap = cmap.concat([0xFF, 0xFF]);
// Fill idDelta
var idDelta = [];
var delta = 0;
var p = 1;
for (var i = 0; i < ranges.length; i++) {
var range = ranges[i];
var start = range[0];
var end = range[range.length - 1];
var diff = end - start;
var delta = -(start - p);
var value = this.integerToBytes(-delta, 2);
value[0] ^= 0xFF;
value[1] ^= 0xFF;
value[1] += 1;
cmap = cmap.concat([value[0], value[1]]);
delta -= range.length;
p += range.length;
};
cmap = cmap.concat([0x00, 0x01]);
// Fill id Offsets with 0x00
for (var i = 0; i < ranges.length; i++) {
var range = ranges[i];
cmap = cmap.concat([0x00, 0x00]);
};
cmap = cmap.concat([0x00, 0x00]);
var cmapHeader = [
0x00, 0x00, // version
0x00, 0x01, // numTables
0x00, 0x03, // platformID
0x00, 0x01, // encodingID
0x00, 0x00, 0x00, 0x0C, // start of the table record
0x00, 0x04 // format
];
cmapHeader = cmapHeader.concat(this.integerToBytes(cmap.length + 6, 2)); // length
cmapHeader = cmapHeader.concat(0x00, 0x00); // language
// Fill up data!
for (var i = 0; i < ranges.length; i++) {
var range = ranges[i];
for (var j = 0; j < range.length; j++) {
cmap = cmap.concat(range[j]);
}
};
cmap = cmapHeader.concat(cmap);
}
var tableEntry = this.createTableEntry("cmap", virtualOffset, cmap);
otf.set(tableEntry, currentOffset);
currentOffset += tableEntry.length;
virtualOffset += cmap.length;
/** HEAD */
var head = [
0x00, 0x01, 0x00, 0x00, // Version number
0x00, 0x00, 0x50, 0x00, // fontRevision
0x00, 0x00, 0x00, 0x00, // checksumAdjustement
0x5F, 0x0F, 0x3C, 0xF5, // magicNumber
0x00, 0x00, // Flags
0x03, 0xE8, // unitsPerEM (>= 16 && <=16384)
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, // created
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, // modified
0x00, 0x00, // xMin
0x00, 0x00, // yMin
0x00, 0x00, // xMax
0x00, 0x00, // yMax
0x00, 0x00, // macStyle
0x00, 0x00, // lowestRecPPEM
0x00, 0x00, // fontDirectionHint
0x00, 0x00, // indexToLocFormat
0x00, 0x00 // glyphDataFormat
];
var tableEntry = this.createTableEntry("head", virtualOffset, head);
otf.set(tableEntry, currentOffset);
currentOffset += tableEntry.length;
virtualOffset += head.length;
/** HHEA */
var hhea = [
0x00, 0x01, 0x00, 0x00, // Version number
0x00, 0x00, // Typographic Ascent
0x00, 0x00, // Typographic Descent
0x00, 0x00, // Line Gap
0xFF, 0xFF, // advanceWidthMax
0x00, 0x00, // minLeftSidebearing
0x00, 0x00, // minRightSidebearing
0x00, 0x00, // xMaxExtent
0x00, 0x00, // caretSlopeRise
0x00, 0x00, // caretSlopeRun
0x00, 0x00, // caretOffset
0x00, 0x00, // -reserved-
0x00, 0x00, // -reserved-
0x00, 0x00, // -reserved-
0x00, 0x00, // -reserved-
0x00, 0x00 // metricDataFormat
];
hhea = hhea.concat(this.integerToBytes(charstrings.length, 2)); // numberOfHMetrics
var tableEntry = this.createTableEntry("hhea", virtualOffset, hhea);
otf.set(tableEntry, currentOffset);
currentOffset += tableEntry.length;
virtualOffset += hhea.length;
/** HMTX */
var hmtx = [0x01, 0xF4, 0x00, 0x00];
for (var i = 0; i < charstrings.length; i++) {
var charstring = charstrings[i].charstring;
var width = this.integerToBytes(charstring[1], 2);
var lsb = this.integerToBytes(charstring[0], 2);
hmtx = hmtx.concat(width, lsb);
}
var tableEntry = this.createTableEntry("hmtx", virtualOffset, hmtx);
otf.set(tableEntry, currentOffset);
currentOffset += tableEntry.length;
virtualOffset += hmtx.length;
/** MAXP */
var maxp = [
0x00, 0x00, 0x50, 0x00, // Version number
].concat(this.integerToBytes(charstrings.length + 1, 2)); // Num of glyphs (+1 to pass the sanitizer...)
var tableEntry = this.createTableEntry("maxp", virtualOffset, maxp);
otf.set(tableEntry, currentOffset);
currentOffset += tableEntry.length;
virtualOffset += maxp.length;
/** NAME */
var name = [
0x00, 0x00, // format
0x00, 0x00, // Number of names Record
0x00, 0x00 // Storage
];
var tableEntry = this.createTableEntry("name", virtualOffset, name);
otf.set(tableEntry, currentOffset);
currentOffset += tableEntry.length;
virtualOffset += name.length;
/** POST */
// XXX get those info from the Font dict!
var post = [
0x00, 0x03, 0x00, 0x00, // Version number
0x00, 0x00, 0x01, 0x00, // italicAngle
0x00, 0x00, // underlinePosition
0x00, 0x00, // underlineThickness
0x00, 0x00, 0x00, 0x00, // isFixedPitch
0x00, 0x00, 0x00, 0x00, // minMemType42
0x00, 0x00, 0x00, 0x00, // maxMemType42
0x00, 0x00, 0x00, 0x00, // minMemType1
0x00, 0x00, 0x00, 0x00 // maxMemType1
];
var tableEntry = this.createTableEntry("post", virtualOffset, post);
otf.set(tableEntry, currentOffset);
currentOffset += tableEntry.length;
virtualOffset += post.length;
// Set the CFF data
otf.set(aData, currentOffset);
currentOffset += aData.length;
var tables = [OS2, cmap, head, hhea, hmtx, maxp, name, post];
for (var i = 0; i < tables.length; i++) {
var table = tables[i];
otf.set(table, currentOffset);
currentOffset += table.length;
}
var fontData = [];
for (var i = 0; i < currentOffset; i++)
fontData.push(otf[i]);
writeToFile(fontData, "/tmp/pdf.js.otf");
return fontData;
}
};