Grammar.php 6.1KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179
  1. <?php
  2. /*
  3. * This file is part of SwiftMailer.
  4. * (c) 2004-2009 Chris Corbyn
  5. *
  6. * For the full copyright and license information, please view the LICENSE
  7. * file that was distributed with this source code.
  8. */
  9. /**
  10. * Defines the grammar to use for validation, implements the RFC 2822 (and friends) ABNF grammar definitions.
  11. * @package Swift
  12. * @subpackage Mime
  13. * @author Fabien Potencier
  14. * @author Chris Corbyn
  15. */
  16. class Swift_Mime_Grammar
  17. {
  18. /**
  19. * Special characters used in the syntax which need to be escaped.
  20. * @var string[]
  21. * @access private
  22. */
  23. private static $_specials = array();
  24. /**
  25. * Tokens defined in RFC 2822 (and some related RFCs).
  26. * @var string[]
  27. * @access private
  28. */
  29. private static $_grammar = array();
  30. /**
  31. * Initialize some RFC 2822 (and friends) ABNF grammar definitions.
  32. * @access protected
  33. */
  34. public function __construct()
  35. {
  36. $this->init();
  37. }
  38. public function __wakeup()
  39. {
  40. $this->init();
  41. }
  42. protected function init()
  43. {
  44. if(count(self::$_specials) > 0)
  45. {
  46. return;
  47. }
  48. self::$_specials = array(
  49. '(', ')', '<', '>', '[', ']',
  50. ':', ';', '@', ',', '.', '"'
  51. );
  52. /*** Refer to RFC 2822 for ABNF grammar ***/
  53. //All basic building blocks
  54. self::$_grammar['NO-WS-CTL'] = '[\x01-\x08\x0B\x0C\x0E-\x19\x7F]';
  55. self::$_grammar['WSP'] = '[ \t]';
  56. self::$_grammar['CRLF'] = '(?:\r\n)';
  57. self::$_grammar['FWS'] = '(?:(?:' . self::$_grammar['WSP'] . '*' .
  58. self::$_grammar['CRLF'] . ')?' . self::$_grammar['WSP'] . ')';
  59. self::$_grammar['text'] = '[\x00-\x08\x0B\x0C\x0E-\x7F]';
  60. self::$_grammar['quoted-pair'] = '(?:\\\\' . self::$_grammar['text'] . ')';
  61. self::$_grammar['ctext'] = '(?:' . self::$_grammar['NO-WS-CTL'] .
  62. '|[\x21-\x27\x2A-\x5B\x5D-\x7E])';
  63. //Uses recursive PCRE (?1) -- could be a weak point??
  64. self::$_grammar['ccontent'] = '(?:' . self::$_grammar['ctext'] . '|' .
  65. self::$_grammar['quoted-pair'] . '|(?1))';
  66. self::$_grammar['comment'] = '(\((?:' . self::$_grammar['FWS'] . '|' .
  67. self::$_grammar['ccontent']. ')*' . self::$_grammar['FWS'] . '?\))';
  68. self::$_grammar['CFWS'] = '(?:(?:' . self::$_grammar['FWS'] . '?' .
  69. self::$_grammar['comment'] . ')*(?:(?:' . self::$_grammar['FWS'] . '?' .
  70. self::$_grammar['comment'] . ')|' . self::$_grammar['FWS'] . '))';
  71. self::$_grammar['qtext'] = '(?:' . self::$_grammar['NO-WS-CTL'] .
  72. '|[\x21\x23-\x5B\x5D-\x7E])';
  73. self::$_grammar['qcontent'] = '(?:' . self::$_grammar['qtext'] . '|' .
  74. self::$_grammar['quoted-pair'] . ')';
  75. self::$_grammar['quoted-string'] = '(?:' . self::$_grammar['CFWS'] . '?"' .
  76. '(' . self::$_grammar['FWS'] . '?' . self::$_grammar['qcontent'] . ')*' .
  77. self::$_grammar['FWS'] . '?"' . self::$_grammar['CFWS'] . '?)';
  78. self::$_grammar['atext'] = '[a-zA-Z0-9!#\$%&\'\*\+\-\/=\?\^_`\{\}\|~]';
  79. self::$_grammar['atom'] = '(?:' . self::$_grammar['CFWS'] . '?' .
  80. self::$_grammar['atext'] . '+' . self::$_grammar['CFWS'] . '?)';
  81. self::$_grammar['dot-atom-text'] = '(?:' . self::$_grammar['atext'] . '+' .
  82. '(\.' . self::$_grammar['atext'] . '+)*)';
  83. self::$_grammar['dot-atom'] = '(?:' . self::$_grammar['CFWS'] . '?' .
  84. self::$_grammar['dot-atom-text'] . '+' . self::$_grammar['CFWS'] . '?)';
  85. self::$_grammar['word'] = '(?:' . self::$_grammar['atom'] . '|' .
  86. self::$_grammar['quoted-string'] . ')';
  87. self::$_grammar['phrase'] = '(?:' . self::$_grammar['word'] . '+?)';
  88. self::$_grammar['no-fold-quote'] = '(?:"(?:' . self::$_grammar['qtext'] .
  89. '|' . self::$_grammar['quoted-pair'] . ')*")';
  90. self::$_grammar['dtext'] = '(?:' . self::$_grammar['NO-WS-CTL'] .
  91. '|[\x21-\x5A\x5E-\x7E])';
  92. self::$_grammar['no-fold-literal'] = '(?:\[(?:' . self::$_grammar['dtext'] .
  93. '|' . self::$_grammar['quoted-pair'] . ')*\])';
  94. //Message IDs
  95. self::$_grammar['id-left'] = '(?:' . self::$_grammar['dot-atom-text'] . '|' .
  96. self::$_grammar['no-fold-quote'] . ')';
  97. self::$_grammar['id-right'] = '(?:' . self::$_grammar['dot-atom-text'] . '|' .
  98. self::$_grammar['no-fold-literal'] . ')';
  99. //Addresses, mailboxes and paths
  100. self::$_grammar['local-part'] = '(?:' . self::$_grammar['dot-atom'] . '|' .
  101. self::$_grammar['quoted-string'] . ')';
  102. self::$_grammar['dcontent'] = '(?:' . self::$_grammar['dtext'] . '|' .
  103. self::$_grammar['quoted-pair'] . ')';
  104. self::$_grammar['domain-literal'] = '(?:' . self::$_grammar['CFWS'] . '?\[(' .
  105. self::$_grammar['FWS'] . '?' . self::$_grammar['dcontent'] . ')*?' .
  106. self::$_grammar['FWS'] . '?\]' . self::$_grammar['CFWS'] . '?)';
  107. self::$_grammar['domain'] = '(?:' . self::$_grammar['dot-atom'] . '|' .
  108. self::$_grammar['domain-literal'] . ')';
  109. self::$_grammar['addr-spec'] = '(?:' . self::$_grammar['local-part'] . '@' .
  110. self::$_grammar['domain'] . ')';
  111. }
  112. /**
  113. * Get the grammar defined for $name token.
  114. * @param string $name execatly as written in the RFC
  115. * @return string
  116. */
  117. public function getDefinition($name)
  118. {
  119. if (array_key_exists($name, self::$_grammar))
  120. {
  121. return self::$_grammar[$name];
  122. }
  123. else
  124. {
  125. throw new Swift_RfcComplianceException(
  126. "No such grammar '" . $name . "' defined."
  127. );
  128. }
  129. }
  130. /**
  131. * Returns the tokens defined in RFC 2822 (and some related RFCs).
  132. * @return array
  133. */
  134. public function getGrammarDefinitions()
  135. {
  136. return self::$_grammar;
  137. }
  138. /**
  139. * Returns the current special characters used in the syntax which need to be escaped.
  140. * @return array
  141. */
  142. public function getSpecials()
  143. {
  144. return self::$_specials;
  145. }
  146. /**
  147. * Escape special characters in a string (convert to quoted-pairs).
  148. * @param string $token
  149. * @param string[] $include additonal chars to escape
  150. * @param string[] $exclude chars from escaping
  151. * @return string
  152. */
  153. public function escapeSpecials($token, $include = array(),
  154. $exclude = array())
  155. {
  156. foreach (
  157. array_merge(array('\\'), array_diff(self::$_specials, $exclude), $include) as $char)
  158. {
  159. $token = str_replace($char, '\\' . $char, $token);
  160. }
  161. return $token;
  162. }
  163. }