array( array("\\\\\\\\/:", "\\\\Q\\\\/:\\\\E"), ), // The expression []{}%#'" should be treated as a list of invalid characters, however the [] is special in PREG so // we use \Q and \E to have PREG treat them as literal characters "ada" => array( array("[]{}%#'\\\"", "\\\\Q[]{}%#'\\\"\\\\E"), ), // WTF, any ideas anyone? "mercury" => array(array("\\\\\\\/", "\\\\\\\\\\\/")), // The expression [^] is not allowed in PREG "lisp" => array(array("[^]", "[^|]")), // There's a typo in the Swift translation file "swift" => array(array( '{02B80}-9', '{02B8}0-9', )), ); for ($i = 0; $i < count($f); $i += 2) { if (!isset($f[$i + 1])) { continue; } $languageName = trim($f[$i]); $jsonLangDef = $f[$i + 1]; // The `-` character must be escaped in while in `[]`. This is enforced in PHP 7.3+ // https://wiki.php.net/rfc/pcre2-migration // https://github.com/php/php-src/pull/2857 $jsonLangDef = preg_replace('/(\[[^:]*?\w)(-)([^a-zA-Z0-9\\\\]+?)/um', '$1\\\\\\-$3', $jsonLangDef); if (!$languageName) { die(sprintf("ERROR: No language name on line %d\n", ($i + 1))); } if (!@json_decode($jsonLangDef)) { die(sprintf("ERROR: Invalid JSON data on line %d\n", ($i + 2))); } if (isset($patches[$languageName])) { foreach ($patches[$languageName] as $j => $patch) { $patched = str_replace($patch[0], $patch[1], $jsonLangDef); if ($jsonLangDef === $patched) { printf("Patch %d for %s was not applied and likely unnecessary\n", $j, $languageName); } $jsonLangDef = $patched; } } $jsonLangDef = json_encode(json_decode($jsonLangDef), JSON_UNESCAPED_UNICODE | JSON_PRETTY_PRINT) . "\n"; if (!file_put_contents("../Highlight/languages/{$languageName}.json", $jsonLangDef)) { die("ERROR: Couldn't write to file.\n"); } }