Blame view

export/PHPRtfLite-1.3.1/lib/PHPRtfLite/Utf8.php 3.49 KB
f90e19c3   Andrea Petta   plugin update
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
  <?php
  /*
      PHPRtfLite
      Copyright 2007-2008 Denis Slaveckij <sinedas@gmail.com>
      Copyright 2010-2012 Steffen Zeidler <sigma_z@sigma-scripts.de>
  
      This file is part of PHPRtfLite.
  
      PHPRtfLite is free software: you can redistribute it and/or modify
      it under the terms of the GNU Lesser General Public License as published by
      the Free Software Foundation, either version 3 of the License, or
      (at your option) any later version.
  
      PHPRtfLite is distributed in the hope that it will be useful,
      but WITHOUT ANY WARRANTY; without even the implied warranty of
      MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
      GNU Lesser General Public License for more details.
  
      You should have received a copy of the GNU Lesser General Public License
      along with PHPRtfLite.  If not, see <http://www.gnu.org/licenses/>.
  */
  
  /**
   * UTF8 class with static functions that convert UTF-8 characters into RTF unicode entities.
   * @version     1.2
   * @author      Denis Slaveckij <sinedas@gmail.com>
   * @author      Steffen Zeidler <sigma_z@sigma-scripts.de>
   * @copyright   2007-2008 Denis Slaveckij, 2010-2012 Steffen Zeidler
   * @package     PHPRtfLite
   */
  class PHPRtfLite_Utf8
  {

      /**
       * Converts text into RTF markup: ASCII characters are kept as they are,
       * every other character is written as an RTF unicode entity (\uN).
       *
       * Text that is not declared as 'UTF-8' is converted to UTF-8 with iconv first.
       *
       * @param  string $text       text to convert
       * @param  string $inCharset  charset of $text; anything other than 'UTF-8' is run through iconv
       * @return string
       * @throws PHPRtfLite_Exception if a conversion is needed and the iconv extension
       *                              is not loaded or the conversion fails
       */
      public static function getUnicodeEntities($text, $inCharset)
      {
          if ($inCharset != 'UTF-8') {
              if (!extension_loaded('iconv')) {
                  throw new PHPRtfLite_Exception('Iconv extension is not available! '
                                               . 'Activate this extension or use UTF-8 encoded texts!');
              }

              $converted = iconv($inCharset, 'UTF-8//TRANSLIT', $text);
              // iconv() returns false on failure; passing that on would silently produce an empty text
              if ($converted === false) {
                  throw new PHPRtfLite_Exception('Text could not be converted from charset "'
                                               . $inCharset . '" to UTF-8!');
              }
              $text = $converted;
          }

          return self::unicodeToEntitiesPreservingAscii(self::utf8ToUnicode($text));
      }


      /**
       * Decodes a UTF-8 byte string into a list of unicode code points.
       * Sequences of one to four bytes are supported. The input is not validated:
       * the length of a sequence is derived from its first byte only.
       * @see http://www.randomchaos.com/documents/?source=php_and_unicode
       *
       * @param  string $str  UTF-8 encoded text
       * @return array        list of integer code points
       */
      private static function utf8ToUnicode($str)
      {
          $str = (string) $str;
          $unicode = array();
          $values = array();
          $lookingFor = 1;
          $length = strlen($str);

          for ($i = 0; $i < $length; $i++) {
              $thisValue = ord($str[$i]);

              // single byte (ASCII) character
              if ($thisValue < 128) {
                  $unicode[] = $thisValue;
                  continue;
              }

              // the first byte of a sequence tells how many bytes belong to it
              if (count($values) == 0) {
                  if ($thisValue < 224) {
                      $lookingFor = 2;
                  }
                  elseif ($thisValue < 240) {
                      $lookingFor = 3;
                  }
                  else {
                      $lookingFor = 4;
                  }
              }

              $values[] = $thisValue;

              if (count($values) == $lookingFor) {
                  if ($lookingFor == 4) {
                      $number = (($values[0] % 8) * 262144) + (($values[1] % 64) * 4096)
                              + (($values[2] % 64) * 64) + ($values[3] % 64);
                  }
                  elseif ($lookingFor == 3) {
                      $number = (($values[0] % 16) * 4096) + (($values[1] % 64) * 64) + ($values[2] % 64);
                  }
                  else {
                      $number = (($values[0] % 32) * 64) + ($values[1] % 64);
                  }

                  $unicode[] = $number;
                  $values = array();
                  $lookingFor = 1;
              }
          }

          return $unicode;
      }


      /**
       * Builds the RTF text for a list of unicode code points. ASCII code points are
       * written as plain characters, all others as \uN entities. The byte order
       * mark (U+FEFF) is dropped.
       *
       * @param  array $unicode  list of integer code points
       * @return string
       */
      private static function unicodeToEntitiesPreservingAscii($unicode)
      {
          $entities = '';

          foreach ($unicode as $value) {
              // skip the byte order mark
              if ($value == 65279) {
                  continue;
              }

              if ($value <= 127) {
                  $entities .= chr($value);
              }
              elseif ($value > 0xFFFF) {
                  // \uN only holds a 16 bit value, so code points beyond the basic
                  // multilingual plane are written as a UTF-16 surrogate pair
                  $offset = $value - 0x10000;
                  $entities .= '\uc0{\u' . (0xD800 + ($offset >> 10))
                             . '\u' . (0xDC00 + ($offset & 0x3FF)) . '}';
              }
              else {
                  $entities .= '\uc0{\u' . $value . '}';
              }
          }

          return $entities;
      }

  }