web/lib/Zend/Pdf/Resource/Font/Simple.php
changeset 64 162c1de6545a
parent 19 1c2f13fd785c
child 68 ecaf28ffe26e
equal deleted inserted replaced
63:5b37998e522e 64:162c1de6545a
       
     1 <?php
       
     2 /**
       
     3  * Zend Framework
       
     4  *
       
     5  * LICENSE
       
     6  *
       
     7  * This source file is subject to the new BSD license that is bundled
       
     8  * with this package in the file LICENSE.txt.
       
     9  * It is also available through the world-wide-web at this URL:
       
    10  * http://framework.zend.com/license/new-bsd
       
    11  * If you did not receive a copy of the license and are unable to
       
    12  * obtain it through the world-wide-web, please send an email
       
    13  * to license@zend.com so we can send you a copy immediately.
       
    14  *
       
    15  * @category   Zend
       
    16  * @package    Zend_Pdf
       
    17  * @subpackage Fonts
       
    18  * @copyright  Copyright (c) 2005-2010 Zend Technologies USA Inc. (http://www.zend.com)
       
    19  * @license    http://framework.zend.com/license/new-bsd     New BSD License
       
    20  * @version    $Id: Simple.php 20096 2010-01-06 02:05:09Z bkarwin $
       
    21  */
       
    22 
       
    23 
       
    24 /** Internally used classes */
       
    25 require_once 'Zend/Pdf/Element/Name.php';
       
    26 
       
    27 
       
    28 /** Zend_Pdf_Resource_Font */
       
    29 require_once 'Zend/Pdf/Resource/Font.php';
       
    30 
       
    31 /**
       
    32  * Adobe PDF Simple fonts implementation
       
    33  *
       
    34  * PDF simple fonts functionality is presented by Adobe Type 1
       
    35  * (including standard PDF Type1 built-in fonts) and TrueType fonts support.
       
    36  *
       
    37  * Both fonts have the following properties:
       
    38  * - Glyphs in the font are selected by single-byte character codes obtained from a
       
    39  *   string that is shown by the text-showing operators. Logically, these codes index
       
    40  *   into a table of 256 glyphs; the mapping from codes to glyphs is called the font’s
       
    41  *   encoding.
       
    42  *   PDF specification provides a possibility to specify any user defined encoding in addition
       
    43  *   to the standard built-in encodings: Standard-Encoding, MacRomanEncoding, WinAnsiEncoding,
       
    44  *   and PDFDocEncoding, but Zend_Pdf simple fonts implementation operates only with
       
    45  *   Windows ANSI encoding (except Symbol and ZapfDingbats built-in fonts).
       
    46  *
       
    47  * - Each glyph has a single set of metrics, including a horizontal displacement or
       
    48  *   width. That is, simple fonts support only horizontal writing mode.
       
    49  *
       
    50  *
       
    51  * The code in this class is common to both types. However, you will only deal
       
    52  * directly with subclasses.
       
    53  *
       
    54  * Font objects should be normally be obtained from the factory methods
       
    55  * {@link Zend_Pdf_Font::fontWithName} and {@link Zend_Pdf_Font::fontWithPath}.
       
    56  *
       
    57  * @package    Zend_Pdf
       
    58  * @subpackage Fonts
       
    59  * @copyright  Copyright (c) 2005-2010 Zend Technologies USA Inc. (http://www.zend.com)
       
    60  * @license    http://framework.zend.com/license/new-bsd     New BSD License
       
    61  */
       
    62 abstract class Zend_Pdf_Resource_Font_Simple extends Zend_Pdf_Resource_Font
       
    63 {
       
    64     /**
       
    65      * Object representing the font's cmap (character to glyph map).
       
    66      * @var Zend_Pdf_Cmap
       
    67      */
       
    68     protected $_cmap = null;
       
    69 
       
    70     /**
       
    71      * Array containing the widths of each of the glyphs contained in the font.
       
    72      *
       
    73      * Keys are integers starting from 0, which coresponds to Zend_Pdf_Cmap::MISSING_CHARACTER_GLYPH.
       
    74      *
       
    75      * Font character map may contain gaps for actually used glyphs, nevertheless glyphWidths array
       
    76      * contains widths for all glyphs even they are unused.
       
    77      *
       
    78      * @var array
       
    79      */
       
    80     protected $_glyphWidths = null;
       
    81 
       
    82     /**
       
    83      * Width for glyphs missed in the font
       
    84      *
       
    85      * Note: Adobe PDF specfication (V1.4 - V1.6) doesn't define behavior for rendering
       
    86      * characters missed in the standard PDF fonts (such us 0x7F (DEL) Windows ANSI code)
       
    87      * Adobe Font Metrics files doesn't also define metrics for "missed glyph".
       
    88      * We provide character width as "0" for this case, but actually it depends on PDF viewer
       
    89      * implementation.
       
    90      *
       
    91      * @var integer
       
    92      */
       
    93     protected $_missingGlyphWidth = 0;
       
    94 
       
    95 
       
    96     /**** Public Interface ****/
       
    97 
       
    98 
       
    99   /* Object Lifecycle */
       
   100 
       
   101     /**
       
   102      * Object constructor
       
   103      *
       
   104      */
       
   105     public function __construct()
       
   106     {
       
   107         parent::__construct();
       
   108 
       
   109         /**
       
   110          * @todo
       
   111          * It's easy to add other encodings support now (Standard-Encoding, MacRomanEncoding,
       
   112          * PDFDocEncoding, MacExpertEncoding, Symbol, and ZapfDingbats).
       
   113          * Steps for the implementation:
       
   114          * - completely describe all PDF single byte encodings in the documentation
       
   115          * - implement non-WinAnsi encodings processing into encodeString()/decodeString() methods
       
   116          *
       
   117          * These encodings will be automatically supported for standard builtin PDF fonts as well
       
   118          * as for external fonts.
       
   119          */
       
   120         $this->_resource->Encoding = new Zend_Pdf_Element_Name('WinAnsiEncoding');
       
   121     }
       
   122 
       
   123     /**
       
   124      * Returns an array of glyph numbers corresponding to the Unicode characters.
       
   125      *
       
   126      * If a particular character doesn't exist in this font, the special 'missing
       
   127      * character glyph' will be substituted.
       
   128      *
       
   129      * See also {@link glyphNumberForCharacter()}.
       
   130      *
       
   131      * @param array $characterCodes Array of Unicode character codes (code points).
       
   132      * @return array Array of glyph numbers.
       
   133      */
       
   134     public function glyphNumbersForCharacters($characterCodes)
       
   135     {
       
   136         return $this->_cmap->glyphNumbersForCharacters($characterCodes);
       
   137     }
       
   138 
       
   139     /**
       
   140      * Returns the glyph number corresponding to the Unicode character.
       
   141      *
       
   142      * If a particular character doesn't exist in this font, the special 'missing
       
   143      * character glyph' will be substituted.
       
   144      *
       
   145      * See also {@link glyphNumbersForCharacters()} which is optimized for bulk
       
   146      * operations.
       
   147      *
       
   148      * @param integer $characterCode Unicode character code (code point).
       
   149      * @return integer Glyph number.
       
   150      */
       
   151     public function glyphNumberForCharacter($characterCode)
       
   152     {
       
   153         return $this->_cmap->glyphNumberForCharacter($characterCode);
       
   154     }
       
   155 
       
   156     /**
       
   157      * Returns a number between 0 and 1 inclusive that indicates the percentage
       
   158      * of characters in the string which are covered by glyphs in this font.
       
   159      *
       
   160      * Since no one font will contain glyphs for the entire Unicode character
       
   161      * range, this method can be used to help locate a suitable font when the
       
   162      * actual contents of the string are not known.
       
   163      *
       
   164      * Note that some fonts lie about the characters they support. Additionally,
       
   165      * fonts don't usually contain glyphs for control characters such as tabs
       
   166      * and line breaks, so it is rare that you will get back a full 1.0 score.
       
   167      * The resulting value should be considered informational only.
       
   168      *
       
   169      * @param string $string
       
   170      * @param string $charEncoding (optional) Character encoding of source text.
       
   171      *   If omitted, uses 'current locale'.
       
   172      * @return float
       
   173      */
       
   174     public function getCoveredPercentage($string, $charEncoding = '')
       
   175     {
       
   176         /* Convert the string to UTF-16BE encoding so we can match the string's
       
   177          * character codes to those found in the cmap.
       
   178          */
       
   179         if ($charEncoding != 'UTF-16BE') {
       
   180             if (PHP_OS != 'AIX') { // AIX doesnt know what UTF-16BE is
       
   181                 $string = iconv($charEncoding, 'UTF-16BE', $string);
       
   182             }
       
   183         }
       
   184 
       
   185         $charCount = (PHP_OS != 'AIX') ? iconv_strlen($string, 'UTF-16BE') : strlen($string);
       
   186         if ($charCount == 0) {
       
   187             return 0;
       
   188         }
       
   189 
       
   190         /* Fetch the covered character code list from the font's cmap.
       
   191          */
       
   192         $coveredCharacters = $this->_cmap->getCoveredCharacters();
       
   193 
       
   194         /* Calculate the score by doing a lookup for each character.
       
   195          */
       
   196         $score = 0;
       
   197         $maxIndex = strlen($string);
       
   198         for ($i = 0; $i < $maxIndex; $i++) {
       
   199             /**
       
   200              * @todo Properly handle characters encoded as surrogate pairs.
       
   201              */
       
   202             $charCode = (ord($string[$i]) << 8) | ord($string[++$i]);
       
   203             /* This could probably be optimized a bit with a binary search...
       
   204              */
       
   205             if (in_array($charCode, $coveredCharacters)) {
       
   206                 $score++;
       
   207             }
       
   208         }
       
   209         return $score / $charCount;
       
   210     }
       
   211 
       
   212     /**
       
   213      * Returns the widths of the glyphs.
       
   214      *
       
   215      * The widths are expressed in the font's glyph space. You are responsible
       
   216      * for converting to user space as necessary. See {@link unitsPerEm()}.
       
   217      *
       
   218      * See also {@link widthForGlyph()}.
       
   219      *
       
   220      * @param array &$glyphNumbers Array of glyph numbers.
       
   221      * @return array Array of glyph widths (integers).
       
   222      */
       
   223     public function widthsForGlyphs($glyphNumbers)
       
   224     {
       
   225         $widths = array();
       
   226         foreach ($glyphNumbers as $key => $glyphNumber) {
       
   227             if (!isset($this->_glyphWidths[$glyphNumber])) {
       
   228                 $widths[$key] = $this->_missingGlyphWidth;
       
   229             } else {
       
   230                 $widths[$key] = $this->_glyphWidths[$glyphNumber];
       
   231             }
       
   232         }
       
   233         return $widths;
       
   234     }
       
   235 
       
   236     /**
       
   237      * Returns the width of the glyph.
       
   238      *
       
   239      * Like {@link widthsForGlyphs()} but used for one glyph at a time.
       
   240      *
       
   241      * @param integer $glyphNumber
       
   242      * @return integer
       
   243      */
       
   244     public function widthForGlyph($glyphNumber)
       
   245     {
       
   246         if (!isset($this->_glyphWidths[$glyphNumber])) {
       
   247             return $this->_missingGlyphWidth;
       
   248         }
       
   249         return $this->_glyphWidths[$glyphNumber];
       
   250     }
       
   251 
       
   252     /**
       
   253      * Convert string to the font encoding.
       
   254      *
       
   255      * The method is used to prepare string for text drawing operators
       
   256      *
       
   257      * @param string $string
       
   258      * @param string $charEncoding Character encoding of source text.
       
   259      * @return string
       
   260      */
       
   261     public function encodeString($string, $charEncoding)
       
   262     {
       
   263         if (PHP_OS == 'AIX') {
       
   264             return $string; // returning here b/c AIX doesnt know what CP1252 is
       
   265         }
       
   266 
       
   267         return iconv($charEncoding, 'CP1252//IGNORE', $string);
       
   268     }
       
   269 
       
   270     /**
       
   271      * Convert string from the font encoding.
       
   272      *
       
   273      * The method is used to convert strings retrieved from existing content streams
       
   274      *
       
   275      * @param string $string
       
   276      * @param string $charEncoding Character encoding of resulting text.
       
   277      * @return string
       
   278      */
       
   279     public function decodeString($string, $charEncoding)
       
   280     {
       
   281         return iconv('CP1252', $charEncoding, $string);
       
   282     }
       
   283 }