Grammar.php 6.7KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175
  1. <?php
  2. /*
  3. * This file is part of SwiftMailer.
  4. * (c) 2004-2009 Chris Corbyn
  5. *
  6. * For the full copyright and license information, please view the LICENSE
  7. * file that was distributed with this source code.
  8. */
  9. /**
  10. * Defines the grammar to use for validation, implements the RFC 2822 (and friends) ABNF grammar definitions.
  11. * @package Swift
  12. * @subpackage Mime
  13. * @author Fabien Potencier
  14. * @author Chris Corbyn
  15. */
  class Swift_Mime_Grammar
  {
      /**
       * Special characters used in the syntax which need to be escaped.
       * Shared by every instance and filled once by init().
       * @var string[]
       */
      private static $_specials = array();

      /**
       * Tokens defined in RFC 2822 (and some related RFCs), keyed by the
       * token name and holding a PCRE fragment (no delimiters).
       * Shared by every instance and filled once by init().
       * @var string[]
       */
      private static $_grammar = array();

      /**
       * Initialize some RFC 2822 (and friends) ABNF grammar definitions.
       */
      public function __construct()
      {
          $this->init();
      }

      /**
       * Make sure the shared grammar tables exist after unserialization.
       */
      public function __wakeup()
      {
          $this->init();
      }

      /**
       * Build the shared specials list and grammar table.
       *
       * Does nothing when the specials list is already populated, so the
       * tables are only built once no matter how many instances are created.
       */
      protected function init()
      {
          if (count(self::$_specials) > 0) {
              return;
          }

          self::$_specials = array(
              '(', ')', '<', '>', '[', ']',
              ':', ';', '@', ',', '.', '"'
          );

          // Built locally and published at the end; insertion order is kept
          // because getGrammarDefinitions() exposes the array as-is.
          $g = array();

          /*** Refer to RFC 2822 for ABNF grammar ***/

          // All basic building blocks
          // NO-WS-CTL = %d1-8 / %d11 / %d12 / %d14-31 / %d127, and %d31 is \x1F
          // (the range previously stopped at \x19 and so missed \x1A-\x1F).
          $g['NO-WS-CTL'] = '[\x01-\x08\x0B\x0C\x0E-\x1F\x7F]';
          $g['WSP'] = '[ \t]';
          $g['CRLF'] = '(?:\r\n)';
          $g['FWS'] = '(?:(?:' . $g['WSP'] . '*' . $g['CRLF'] . ')?' . $g['WSP'] . ')';
          // NOTE(review): RFC 2822 "text" also lists HTAB (%d9), which this
          // character class omits; left unchanged -- confirm whether intentional.
          $g['text'] = '[\x00-\x08\x0B\x0C\x0E-\x7F]';
          $g['quoted-pair'] = '(?:\\\\' . $g['text'] . ')';
          $g['ctext'] = '(?:' . $g['NO-WS-CTL'] . '|[\x21-\x27\x2A-\x5B\x5D-\x7E])';
          // Nested comments are handled with the recursive reference (?1). It
          // resolves to the FIRST capturing group of the final pattern, which
          // is a "comment" group in every token below that embeds CFWS.
          $g['ccontent'] = '(?:' . $g['ctext'] . '|' . $g['quoted-pair'] . '|(?1))';
          $g['comment'] = '(\((?:' . $g['FWS'] . '|' . $g['ccontent'] . ')*' .
              $g['FWS'] . '?\))';
          $g['CFWS'] = '(?:(?:' . $g['FWS'] . '?' . $g['comment'] . ')*(?:(?:' .
              $g['FWS'] . '?' . $g['comment'] . ')|' . $g['FWS'] . '))';
          $g['qtext'] = '(?:' . $g['NO-WS-CTL'] . '|[\x21\x23-\x5B\x5D-\x7E])';
          $g['qcontent'] = '(?:' . $g['qtext'] . '|' . $g['quoted-pair'] . ')';
          $g['quoted-string'] = '(?:' . $g['CFWS'] . '?"' .
              '(' . $g['FWS'] . '?' . $g['qcontent'] . ')*' .
              $g['FWS'] . '?"' . $g['CFWS'] . '?)';
          $g['atext'] = '[a-zA-Z0-9!#\$%&\'\*\+\-\/=\?\^_`\{\}\|~]';
          $g['atom'] = '(?:' . $g['CFWS'] . '?' . $g['atext'] . '+' . $g['CFWS'] . '?)';
          $g['dot-atom-text'] = '(?:' . $g['atext'] . '+' . '(\.' . $g['atext'] . '+)*)';
          // dot-atom = [CFWS] dot-atom-text [CFWS]. dot-atom-text already
          // repeats internally, so no outer "+" is applied: it would match the
          // same strings but nest quantifiers and allow exponential
          // backtracking on input that almost matches.
          $g['dot-atom'] = '(?:' . $g['CFWS'] . '?' . $g['dot-atom-text'] .
              $g['CFWS'] . '?)';
          $g['word'] = '(?:' . $g['atom'] . '|' . $g['quoted-string'] . ')';
          $g['phrase'] = '(?:' . $g['word'] . '+?)';
          $g['no-fold-quote'] = '(?:"(?:' . $g['qtext'] . '|' . $g['quoted-pair'] . ')*")';
          $g['dtext'] = '(?:' . $g['NO-WS-CTL'] . '|[\x21-\x5A\x5E-\x7E])';
          $g['no-fold-literal'] = '(?:\[(?:' . $g['dtext'] . '|' .
              $g['quoted-pair'] . ')*\])';

          // Message IDs
          $g['id-left'] = '(?:' . $g['dot-atom-text'] . '|' . $g['no-fold-quote'] . ')';
          $g['id-right'] = '(?:' . $g['dot-atom-text'] . '|' . $g['no-fold-literal'] . ')';

          // Addresses, mailboxes and paths
          $g['local-part'] = '(?:' . $g['dot-atom'] . '|' . $g['quoted-string'] . ')';
          $g['dcontent'] = '(?:' . $g['dtext'] . '|' . $g['quoted-pair'] . ')';
          $g['domain-literal'] = '(?:' . $g['CFWS'] . '?\[(' .
              $g['FWS'] . '?' . $g['dcontent'] . ')*?' .
              $g['FWS'] . '?\]' . $g['CFWS'] . '?)';
          $g['domain'] = '(?:' . $g['dot-atom'] . '|' . $g['domain-literal'] . ')';
          $g['addr-spec'] = '(?:' . $g['local-part'] . '@' . $g['domain'] . ')';

          self::$_grammar = $g;
      }

      /**
       * Get the grammar defined for $name token.
       * @param string $name exactly as written in the RFC
       * @return string PCRE fragment without delimiters
       * @throws Swift_RfcComplianceException if no token of that name is defined
       */
      public function getDefinition($name)
      {
          if (!array_key_exists($name, self::$_grammar)) {
              throw new Swift_RfcComplianceException(
                  "No such grammar '" . $name . "' defined."
              );
          }

          return self::$_grammar[$name];
      }

      /**
       * Returns the tokens defined in RFC 2822 (and some related RFCs).
       * @return array token name => PCRE fragment
       */
      public function getGrammarDefinitions()
      {
          return self::$_grammar;
      }

      /**
       * Returns the current special characters used in the syntax which need to be escaped.
       * @return array
       */
      public function getSpecials()
      {
          return self::$_specials;
      }

      /**
       * Escape special characters in a string (convert to quoted-pairs).
       *
       * The backslash is always escaped, and always first, so that the
       * backslashes inserted for the other characters are not escaped again.
       *
       * @param string   $token
       * @param string[] $include additional chars to escape
       * @param string[] $exclude chars from escaping
       * @return string
       */
      public function escapeSpecials($token, $include = array(), $exclude = array())
      {
          // De-duplicate: a char present both in $include and in the remaining
          // specials (or a backslash passed in $include) must be escaped once,
          // otherwise its freshly inserted backslash prefix is doubled.
          $chars = array_unique(
              array_merge(array('\\'), array_diff(self::$_specials, $exclude), $include)
          );

          foreach ($chars as $char) {
              $token = str_replace($char, '\\' . $char, $token);
          }

          return $token;
      }
  }