Guessing pdf char size based on the CMap numbers

author Yury Delendik <ydelendik@mozilla.com>

Mon, 23 Apr 2012 22:44:51 +0000 (17:44 -0500)

committer Yury Delendik <ydelendik@mozilla.com>

Mon, 23 Apr 2012 22:44:51 +0000 (17:44 -0500)
author Yury Delendik <ydelendik@mozilla.com>
Mon, 23 Apr 2012 22:44:51 +0000 (17:44 -0500)
committer Yury Delendik <ydelendik@mozilla.com>
Mon, 23 Apr 2012 22:44:51 +0000 (17:44 -0500)
diff --git a/src/evaluator.js b/src/evaluator.js

index e073942013e2bb2a0fb7982b67e7c04ef0aeba1b..23c9d1f657680cdf8f53143dacaceff36c7d3457 100644 (file)
--- a/src/evaluator.js
+++ b/src/evaluator.js
@@ -481,7 +481,7 @@ var PartialEvaluator = (function PartialEvaluatorClosure() {
        var toUnicode = dict.get('ToUnicode') ||
          baseDict.get('ToUnicode');
        if (toUnicode)
-        properties.toUnicode = this.readToUnicode(toUnicode, xref);
+        properties.toUnicode = this.readToUnicode(toUnicode, xref, properties);
  
        if (properties.composite) {
          // CIDSystemInfo helps to match CID to glyphs
@@ -537,7 +537,8 @@ var PartialEvaluator = (function PartialEvaluatorClosure() {
        properties.hasEncoding = hasEncoding;
      },
  
-    readToUnicode: function PartialEvaluator_readToUnicode(toUnicode, xref) {
+    readToUnicode: function PartialEvaluator_readToUnicode(toUnicode, xref,
+                                                           properties) {
        var cmapObj = toUnicode;
        var charToUnicode = [];
        if (isName(cmapObj)) {
@@ -626,6 +627,10 @@ var PartialEvaluator = (function PartialEvaluatorClosure() {
              }
            } else if (octet == 0x3E) {
              if (token.length) {
+              // XXX guessing chars size by checking number size in the CMap
+              if (token.length <= 2 && properties.composite)
+                properties.wideChars = false;
+
                if (token.length <= 4) {
                  // parsing hex number
                  tokens.push(parseInt(token, 16));
@@ -843,6 +848,7 @@ var PartialEvaluator = (function PartialEvaluatorClosure() {
          length1: length1,
          length2: length2,
          composite: composite,
+        wideChars: composite,
          fixedPitch: false,
          fontMatrix: dict.get('FontMatrix') || IDENTITY_MATRIX,
          firstChar: firstChar || 0,
diff --git a/src/fonts.js b/src/fonts.js

index 7bd3ddd0676b0867b4069fea3dc82fd63eeebc54..22037e7245bebbcfc1c723c0c88919ab7272d9b5 100644 (file)
--- a/src/fonts.js
+++ b/src/fonts.js
@@ -789,6 +789,7 @@ var Font = (function FontClosure() {
      this.widths = properties.widths;
      this.defaultWidth = properties.defaultWidth;
      this.composite = properties.composite;
+    this.wideChars = properties.wideChars;
      this.hasEncoding = properties.hasEncoding;
  
      this.fontMatrix = properties.fontMatrix;
@@ -2520,7 +2521,7 @@ var Font = (function FontClosure() {
  
        glyphs = [];
  
-      if (this.composite) {
+      if (this.wideChars) {
          // composite fonts have multi-byte strings convert the string from
          // single-byte to multi-byte
          // XXX assuming CIDFonts are two-byte - later need to extract the
author	Yury Delendik <ydelendik@mozilla.com>
	Mon, 23 Apr 2012 22:44:51 +0000 (17:44 -0500)
committer	Yury Delendik <ydelendik@mozilla.com>
	Mon, 23 Apr 2012 22:44:51 +0000 (17:44 -0500)
src/evaluator.js		patch \| blob \| history
src/fonts.js		patch \| blob \| history