Files
luos/gulliver/thirdparty/html2ps_pdf/manager.encoding.php

247 lines
7.1 KiB
PHP
Executable File

<?php
require_once(HTML2PS_DIR.'encoding.inc.php');
require_once(HTML2PS_DIR.'encoding.entities.inc.php');
require_once(HTML2PS_DIR.'encoding.glyphs.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-1.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-2.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-3.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-4.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-5.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-6.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-7.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-8.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-9.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-10.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-11.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-13.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-14.inc.php');
require_once(HTML2PS_DIR.'encoding.iso-8859-15.inc.php');
require_once(HTML2PS_DIR.'encoding.koi8-r.inc.php');
require_once(HTML2PS_DIR.'encoding.cp866.inc.php');
require_once(HTML2PS_DIR.'encoding.windows-1250.inc.php');
require_once(HTML2PS_DIR.'encoding.windows-1251.inc.php');
require_once(HTML2PS_DIR.'encoding.windows-1252.inc.php');
require_once(HTML2PS_DIR.'encoding.dingbats.inc.php');
require_once(HTML2PS_DIR.'encoding.symbol.inc.php');
// TODO: this works for PS encoding names only
class ManagerEncoding {
var $_encodings;
var $_custom_vector_name;
var $_utf8_mapping;
function getMapping($char) {
if (!isset($this->_utf8_mapping)) {
$this->_loadMapping(CACHE_DIR . 'utf8.mappings.dat');
};
if (!isset($this->_utf8_mapping[$char])) {
return null;
};
return $this->_utf8_mapping[$char];
}
function _loadMapping($mapping_file) {
if (!is_readable($mapping_file)) {
$this->_generateMapping($mapping_file);
} else {
$this->_utf8_mapping = unserialize(file_get_contents($mapping_file));
};
}
function _generateMapping($mapping_file) {
global $g_utf8_converters;
$this->_utf8_mapping = array();
foreach (array_keys($g_utf8_converters) as $encoding) {
$flipped = array_flip($g_utf8_converters[$encoding][0]);
foreach ($flipped as $utf => $code) {
$this->_utf8_mapping[code_to_utf8($utf)][$encoding] = $code;
};
};
$file = fopen($mapping_file,'w');
fwrite($file, serialize($this->_utf8_mapping));
fclose($file);
}
function ManagerEncoding() {
$this->_encodings = array();
$this->registerCustomEncoding("custom", array(0,1,2,3,4,5,6,7,8,9,10,
11,12,13,14,15,16,17,18,19,20,
21,22,23,24,25,26,27,28,29,30,
31,32));
}
function getCanonizedEncodingName($encoding) {
global $g_encoding_aliases;
if (isset($g_encoding_aliases[$encoding])) {
return $g_encoding_aliases[$encoding];
};
return $encoding;
}
function registerCustomEncoding($name, $vector) {
$this->registerEncoding($name, $vector);
$this->_custom_vector_name = $name;
}
function getCustomEncodingName() {
return $this->_custom_vector_name;
}
function getCustomEncodingVector() {
return $this->_encodings[$this->getCustomEncodingName()];
}
function registerEncoding($name, $vector) {
$this->_encodings[$name] = $vector;
}
/**
* @TODO: handle more than 256 custom characters
*/
function addCustomChar($char) {
$vector_name = $this->getCustomEncodingName();
$index = count($this->_encodings[$vector_name]);
$this->_encodings[$vector_name][$index] = $char;
$this->_utf8_mapping[chr($index)]['custom'] = $char;
return chr($index);
}
/**
* Get an encoding vector (array containing 256 elements; every
* element is an ucs-2 encoded character)
*
* @param $encoding Encoding name
*
* @return Array encoding vector; null if this encoding is not known to the script
*/
function getEncodingVector($encoding) {
$encoding = $this->getCanonizedEncodingName($encoding);
/**
* @TODO: HACK. Currently custom encoding and "standard" encodings
* are handled separately, so we must explicitly check if current
* encoding is custom
*/
if ($encoding == $this->getCustomEncodingName()) {
$vector = array();
$custom_vector = $this->getCustomEncodingVector();
$size = count($custom_vector);
for ($i=0; $i<$size; $i++) {
$vector[chr($i)] = $custom_vector[$i];
};
} else {
global $g_utf8_converters;
if (!isset($g_utf8_converters[$encoding])) {
return null;
};
$vector = $g_utf8_converters[$encoding][0];
};
for ($i=0; $i<=255; $i++) {
if (!isset($vector[chr($i)])) {
$vector[chr($i)] = 0xFFFF;
};
};
return $vector;
}
function &get() {
global $g_manager_encodings;
return $g_manager_encodings;
}
function get_encoding_glyphs($encoding) {
$vector = $this->getEncodingVector($encoding);
if (is_null($vector)) {
error_log(sprintf("Cannot get encoding vector for encoding '%s'", $encoding));
return null;
};
return $this->vector_to_glyphs($vector);
}
function get_glyph_to_code_mapping($encoding) {
$vector = $this->getEncodingVector($encoding);
$result = array();
foreach ($vector as $code => $uccode) {
if (isset($GLOBALS['g_unicode_glyphs'][$uccode])) {
$result[$GLOBALS['g_unicode_glyphs'][$uccode]][] = $code;
};
};
return $result;
}
function vector_to_glyphs($vector) {
$result = array();
foreach ($vector as $code => $ucs2) {
if (isset($GLOBALS['g_unicode_glyphs'][$ucs2])) {
$result[$code] = $GLOBALS['g_unicode_glyphs'][$ucs2];
} elseif ($ucs2 == 0xFFFF) {
$result[$code] = ".notdef";
} else {
// Use "Unicode and Glyph Names" mapping from Adobe
// http://partners.adobe.com/public/developer/opentype/index_glyph.html
$result[$code] = sprintf("u%04X", $ucs2);
};
};
return $result;
}
function get_ps_encoding_vector($encoding) {
$vector = $this->getEncodingVector($encoding);
$result = "/".$encoding." [ \n";
for ($i=0; $i<256; $i++) {
if ($i % 10 == 0) { $result .= "\n"; };
// ! Note the order of array checking; optimizing interpreters may break this
if (isset($vector[chr($i)]) && isset($GLOBALS['g_unicode_glyphs'][$vector[chr($i)]])) {
$result .= " /".$GLOBALS['g_unicode_glyphs'][$vector[chr($i)]];
} else {
$result .= " /.notdef";
};
};
$result .= " ] readonly def";
return $result;
}
function getNextUTF8Char($raw_content, &$ptr) {
if ((ord($raw_content{$ptr}) & 0xF0) == 0xF0) {
$charlen = 4;
} elseif ((ord($raw_content{$ptr}) & 0xE0) == 0xE0) {
$charlen = 3;
} elseif ((ord($raw_content{$ptr}) & 0xC0) == 0xC0) {
$charlen = 2;
} else {
$charlen = 1;
};
$char = substr($raw_content,$ptr,$charlen);
$ptr += $charlen;
return $char;
}
}
global $g_manager_encodings;
$g_manager_encodings = new ManagerEncoding;
?>