RegEx.php 3.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107
  1. <?php
  2. /* Copyright (c) 2019 Geert Bergman (geert@scrivo.nl), highlight.php
  3. *
  4. * Redistribution and use in source and binary forms, with or without
  5. * modification, are permitted provided that the following conditions are met:
  6. *
  7. * 1. Redistributions of source code must retain the above copyright notice,
  8. * this list of conditions and the following disclaimer.
  9. * 2. Redistributions in binary form must reproduce the above copyright notice,
  10. * this list of conditions and the following disclaimer in the documentation
  11. * and/or other materials provided with the distribution.
  12. * 3. Neither the name of "highlight.js", "highlight.php", nor the names of its
  13. * contributors may be used to endorse or promote products derived from this
  14. * software without specific prior written permission.
  15. *
  16. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  17. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  18. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  19. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
  20. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  21. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  22. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  23. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  24. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  25. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  26. * POSSIBILITY OF SUCH DAMAGE.
  27. */
  28. namespace Highlight;
  29. /**
  30. * A PHP implementation to match JavaScript's RegExp class as closely as possible.
  31. *
  32. * A lot of behavior in this class is reversed engineered, so improvements are welcome!
  33. *
  34. * @internal
  35. *
  36. * @since 9.16.0
  37. */
  38. final class RegEx
  39. {
  40. /**
  41. * @var string
  42. */
  43. public $source;
  44. /**
  45. * @var int
  46. */
  47. public $lastIndex = 0;
  48. /**
  49. * @param RegEx|string $regex
  50. */
  51. public function __construct($regex)
  52. {
  53. $this->source = (string) $regex;
  54. }
  55. public function __toString()
  56. {
  57. return (string) $this->source;
  58. }
  59. /**
  60. * Run the regular expression against the given string.
  61. *
  62. * @since 9.16.0.0
  63. *
  64. * @param string $str the string to run this regular expression against
  65. *
  66. * @return RegExMatch|null
  67. */
  68. public function exec($str)
  69. {
  70. $index = null;
  71. $results = array();
  72. preg_match_all($this->source, $str, $results, PREG_SET_ORDER | PREG_OFFSET_CAPTURE, $this->lastIndex);
  73. if ($results === null || count($results) === 0) {
  74. return null;
  75. }
  76. foreach ($results[0] as &$result) {
  77. if ($result[1] !== -1) {
  78. // Only save the index if it hasn't been set yet
  79. if ($index === null) {
  80. $index = $result[1];
  81. }
  82. $result = $result[0];
  83. } else {
  84. $result = null;
  85. }
  86. }
  87. $results = $results[0];
  88. $this->lastIndex += mb_strlen($results[0]) + ($index - $this->lastIndex);
  89. $matches = new RegExMatch($results);
  90. $matches->index = isset($index) ? $index : 0;
  91. $matches->input = $str;
  92. return $matches;
  93. }
  94. }