1. Codes meant to be in hex are specified in decimal.
Consequently characters which don't need escaping are escaped.
2. Special handling (prepend backslash) needed for {, }, and \.
RTF docs generated with those characters cannot be opened in Word.
3. Tab character needs to be escaped as \tab.
RTF docs drop these characters.
While running test suite, found that Writer/RTF/ElementTest was coded
only for Unix line endings, and fails on Windows. Changed so that it
would work on either.
98 lines
3.1 KiB
PHP
98 lines
3.1 KiB
PHP
<?php
|
|
/**
|
|
* This file is part of PHPWord - A pure PHP library for reading and writing
|
|
* word processing documents.
|
|
*
|
|
* PHPWord is free software distributed under the terms of the GNU Lesser
|
|
* General Public License version 3 as published by the Free Software Foundation.
|
|
*
|
|
* For the full copyright and license information, please read the LICENSE
|
|
* file that was distributed with this source code. For the full list of
|
|
* contributors, visit https://github.com/PHPOffice/PHPWord/contributors.
|
|
*
|
|
* @see https://github.com/PHPOffice/PHPWord
|
|
* @copyright 2010-2018 PHPWord contributors
|
|
* @license http://www.gnu.org/licenses/lgpl.txt LGPL version 3
|
|
*/
|
|
|
|
namespace PhpOffice\PhpWord\Escaper;
|
|
|
|
/**
|
|
* @since 0.13.0
|
|
*
|
|
* @codeCoverageIgnore
|
|
*/
|
|
class Rtf extends AbstractEscaper
|
|
{
|
|
protected function escapeAsciiCharacter($code)
|
|
{
|
|
if ($code == 9) {
|
|
return '{\\tab}';
|
|
}
|
|
if (0x20 > $code || $code >= 0x80) {
|
|
return '{\\u' . $code . '}';
|
|
}
|
|
if ($code == 123 || $code == 125 || $code == 92) { // open or close brace or backslash
|
|
return '\\' . chr($code);
|
|
}
|
|
|
|
return chr($code);
|
|
}
|
|
|
|
protected function escapeMultibyteCharacter($code)
|
|
{
|
|
return '\\uc0{\\u' . $code . '}';
|
|
}
|
|
|
|
/**
|
|
* @see http://www.randomchaos.com/documents/?source=php_and_unicode
|
|
* @param string $input
|
|
*/
|
|
protected function escapeSingleValue($input)
|
|
{
|
|
$escapedValue = '';
|
|
|
|
$numberOfBytes = 1;
|
|
$bytes = array();
|
|
for ($i = 0; $i < strlen($input); ++$i) {
|
|
$character = $input[$i];
|
|
$asciiCode = ord($character);
|
|
|
|
if ($asciiCode < 128) {
|
|
$escapedValue .= $this->escapeAsciiCharacter($asciiCode);
|
|
} else {
|
|
if (0 == count($bytes)) {
|
|
if ($asciiCode < 224) {
|
|
$numberOfBytes = 2;
|
|
} elseif ($asciiCode < 240) {
|
|
$numberOfBytes = 3;
|
|
} elseif ($asciiCode < 248) {
|
|
$numberOfBytes = 4;
|
|
}
|
|
}
|
|
|
|
$bytes[] = $asciiCode;
|
|
|
|
if ($numberOfBytes == count($bytes)) {
|
|
if (4 == $numberOfBytes) {
|
|
$multibyteCode = ($bytes[0] % 8) * 262144 + ($bytes[1] % 64) * 4096 + ($bytes[2] % 64) * 64 + ($bytes[3] % 64);
|
|
} elseif (3 == $numberOfBytes) {
|
|
$multibyteCode = ($bytes[0] % 16) * 4096 + ($bytes[1] % 64) * 64 + ($bytes[2] % 64);
|
|
} else {
|
|
$multibyteCode = ($bytes[0] % 32) * 64 + ($bytes[1] % 64);
|
|
}
|
|
|
|
if (65279 != $multibyteCode) {
|
|
$escapedValue .= $multibyteCode < 128 ? $this->escapeAsciiCharacter($multibyteCode) : $this->escapeMultibyteCharacter($multibyteCode);
|
|
}
|
|
|
|
$numberOfBytes = 1;
|
|
$bytes = array();
|
|
}
|
|
}
|
|
}
|
|
|
|
return $escapedValue;
|
|
}
|
|
}
|