<?php

/*
 * NOTE(review): the license header that belongs here was truncated in the reviewed copy
 * of this file (only its final "." survived). Restore it from version control.
 */

declare(strict_types=1);

namespace Fisharebest\Webtrees\Report;

use Fisharebest\Webtrees\I18N;

use function ord;
use function preg_replace;
use function str_contains;
use function str_pad;
use function str_replace;
use function strlen;
use function strpos;
use function strrpos;
use function strtolower;
use function strtoupper;
use function substr;

use const STR_PAD_LEFT;
use const STR_PAD_RIGHT;

/**
 * RTL Functions for use in the PDF reports
 *
 * The class works on temporary markers while it splits text into directional runs:
 * <LTR>...</LTR> and <RTL>...</RTL> delimit runs, <LTRbr> and <RTLbr> are line breaks found
 * inside a run. spanLtrRtl() converts all of them to real markup before returning.
 */
class RightToLeftSupport
{
    private const UTF8_LRM = "\xE2\x80\x8E"; // U+200E (Left to Right mark:  zero-width character with LTR directionality)
    private const UTF8_RLM = "\xE2\x80\x8F"; // U+200F (Right to Left mark:  zero-width character with RTL directionality)
    private const UTF8_LRO = "\xE2\x80\xAD"; // U+202D (Left to Right override: force everything following to LTR mode)
    private const UTF8_RLO = "\xE2\x80\xAE"; // U+202E (Right to Left override: force everything following to RTL mode)
    private const UTF8_LRE = "\xE2\x80\xAA"; // U+202A (Left to Right embedding: treat everything following as LTR text)
    private const UTF8_RLE = "\xE2\x80\xAB"; // U+202B (Right to Left embedding: treat everything following as RTL text)
    private const UTF8_PDF = "\xE2\x80\xAC"; // U+202C (Pop directional formatting: restore state prior to last LRO, RLO, LRE, RLE)

    private const OPEN_PARENTHESES  = '([{';
    private const CLOSE_PARENTHESES = ')]}';

    private const NUMBERS            = '0123456789';
    private const NUMBER_PREFIX      = '+-'; // Treat these like numbers when at beginning or end of numeric strings
    private const NUMBER_PUNCTUATION = '- ,.:/'; // Treat these like numbers when inside numeric strings
    private const PUNCTUATION        = ',.:;?!';

    // Markup. LENGTH_START and LENGTH_END are the byte lengths of the START_* and END_* markers.
    private const START_LTR    = '<LTR>';
    private const END_LTR      = '</LTR>';
    private const START_RTL    = '<RTL>';
    private const END_RTL      = '</RTL>';
    private const LENGTH_START = 5;
    private const LENGTH_END   = 6;

    // Byte length of the in-span break markers '<LTRbr>' and '<RTLbr>' written by breakCurrentSpan().
    private const LENGTH_BREAK = 7;

    /* Were we previously processing LTR or RTL. */
    private static string $previousState;

    /* Are we currently processing LTR or RTL. */
    private static string $currentState;

    /* Text waiting to be processed. */
    private static string $waitingText;

    /* Offset into the text. */
    private static int $posSpanStart;

    /**
     * This function strips &lrm; and &rlm; from the input string. It should be used for all
     * text that has been passed through the PrintReady() function before that text is stored
     * in the database. The database should NEVER contain these characters.
     *
     * Besides the two entities (in lower and upper case), the raw UTF-8 directional control
     * characters LRM, RLM, LRO, RLO, LRE, RLE and PDF are removed as well.
     *
     * @param string $inputText The string from which the &lrm; and &rlm; characters should be stripped
     *
     * @return string The input string, with &lrm; and &rlm; stripped
     */
    private static function stripLrmRlm(string $inputText): string
    {
        return str_replace([
            self::UTF8_LRM,
            self::UTF8_RLM,
            self::UTF8_LRO,
            self::UTF8_RLO,
            self::UTF8_LRE,
            self::UTF8_RLE,
            self::UTF8_PDF,
            '&lrm;',
            '&rlm;',
            '&LRM;',
            '&RLM;',
        ], '', $inputText);
    }

    /**
     * This function encapsulates all texts in the input with <span dir="rtl"> and <span dir="ltr">
     * according to the directionality specified.
     *
     * The text is consumed one character (or one HTML element / entity / "{{...}}" directive) at a
     * time. Each change of direction closes the current run via finishCurrentSpan() and opens a new
     * one via beginCurrentSpan(). A series of string clean-ups follows, and finally the temporary
     * markers are replaced by real <span> elements.
     *
     * @param string $inputText Raw input
     *
     * @return string The string with all texts encapsulated as required
     */
    public static function spanLtrRtl(string $inputText): string
    {
        if ($inputText === '') {
            // Nothing to do
            return '';
        }

        $workingText = str_replace("\n", '<br>', $inputText);
        $workingText = str_replace([
            '<span class="starredname"><br>',
            '<span<br>class="starredname">',
        ], '<br><span class="starredname">', $workingText); // Reposition some incorrectly placed line breaks
        $workingText = self::stripLrmRlm($workingText); // Get rid of any existing UTF8 control codes

        self::$previousState = '';
        self::$currentState  = strtoupper(I18N::direction());
        $numberState         = false; // Set when we're inside a numeric string
        $result              = '';
        self::$waitingText   = '';
        $openParDirection    = [];

        self::beginCurrentSpan($result);

        while ($workingText !== '') {
            $charArray     = self::getChar($workingText, 0); // Get the next ASCII or UTF-8 character
            $currentLetter = $charArray['letter'];
            $currentLen    = $charArray['length'];

            $openParIndex  = strpos(self::OPEN_PARENTHESES, $currentLetter); // Which opening parenthesis is this?
            $closeParIndex = strpos(self::CLOSE_PARENTHESES, $currentLetter); // Which closing parenthesis is this?

            switch ($currentLetter) {
                case '<':
                    // Assume this '<' starts an HTML element
                    $endPos = strpos($workingText, '>'); // look for the terminating '>'
                    if ($endPos === false) {
                        $endPos = 0;
                    }
                    $currentLen += $endPos;
                    $element    = substr($workingText, 0, $currentLen);
                    $temp       = strtolower(substr($element, 0, 3));
                    if (strlen($element) < 7 && $temp === '<br') {
                        // NOTE(review): from this point down to the ASCII-letter test in the default
                        // branch, the reviewed copy of this file had lost its text (markup-like content
                        // had been stripped). This stretch was rebuilt from the surviving comments,
                        // constants and state variables - verify it against version control.
                        if ($numberState) {
                            $numberState = false;
                            if (self::$currentState === 'RTL') {
                                self::$waitingText .= self::UTF8_PDF;
                            }
                        }
                        self::breakCurrentSpan($result);
                    } elseif (self::$waitingText === '') {
                        $result .= $element;
                    } else {
                        self::$waitingText .= $element;
                    }
                    $workingText = substr($workingText, $currentLen);
                    break;

                case '&':
                    // Assume this '&' starts an HTML entity
                    $endPos = strpos($workingText, ';'); // look for the terminating ';'
                    if ($endPos === false) {
                        $endPos = 0;
                    }
                    $currentLen += $endPos;
                    $entity     = substr($workingText, 0, $currentLen);
                    if (strtolower($entity) === '&nbsp;') {
                        $entity = '&nbsp;'; // Ensure consistent case for this entity
                    }
                    if (self::$waitingText === '') {
                        $result .= $entity;
                    } else {
                        self::$waitingText .= $entity;
                    }
                    $workingText = substr($workingText, $currentLen);
                    break;

                case '{':
                    if (substr($workingText, 1, 1) === '{') {
                        // Assume this '{{' starts a TCPDF directive
                        $endPos = strpos($workingText, '}}'); // look for the terminating '}}'
                        if ($endPos === false) {
                            $endPos = 0;
                        }
                        $currentLen        = $endPos + 2;
                        $directive         = substr($workingText, 0, $currentLen);
                        $workingText       = substr($workingText, $currentLen);
                        $result            .= self::$waitingText . $directive;
                        self::$waitingText = '';
                        break;
                    }
                    // A single '{' is an ordinary opening parenthesis
                    // no break

                default:
                    // Look for strings of numbers with optional leading or trailing + or -
                    // and with optional embedded numeric punctuation
                    if ($numberState) {
                        // If we're inside a numeric string, look for reasons to end it
                        $offset    = 0; // Be sure to look at the current character first
                        $charArray = self::getChar($workingText . "\n", $offset);
                        if (!str_contains(self::NUMBERS, $charArray['letter'])) {
                            // This is not a digit. Is it numeric punctuation?
                            if (substr($workingText . "\n", $offset, 6) === '&nbsp;') {
                                $offset += 6; // This could be numeric punctuation
                            } elseif (str_contains(self::NUMBER_PUNCTUATION, $charArray['letter'])) {
                                $offset += $charArray['length']; // This could be numeric punctuation
                            }
                            // If the next character is a digit, the current character is numeric punctuation
                            $charArray = self::getChar($workingText . "\n", $offset);
                            if (!str_contains(self::NUMBERS, $charArray['letter'])) {
                                // This is not a digit. End the run of digits and punctuation.
                                $numberState = false;
                                if (self::$currentState === 'RTL') {
                                    if (!str_contains(self::NUMBER_PREFIX, $currentLetter)) {
                                        $currentLetter = self::UTF8_PDF . $currentLetter;
                                    } else {
                                        $currentLetter .= self::UTF8_PDF; // Include a trailing + or - in the run
                                    }
                                }
                            }
                        }
                    } else {
                        // If we're outside a numeric string, look for reasons to start it
                        if (str_contains(self::NUMBER_PREFIX, $currentLetter)) {
                            // This might be a number lead-in
                            $offset   = $currentLen;
                            $nextChar = substr($workingText . "\n", $offset, 1);
                            if (str_contains(self::NUMBERS, $nextChar)) {
                                $numberState = true; // We found a digit: the lead-in is therefore numeric
                                if (self::$currentState === 'RTL') {
                                    $currentLetter = self::UTF8_LRE . $currentLetter;
                                }
                            }
                        } elseif (str_contains(self::NUMBERS, $currentLetter)) {
                            $numberState = true; // The current letter is a digit
                            if (self::$currentState === 'RTL') {
                                $currentLetter = self::UTF8_LRE . $currentLetter;
                            }
                        }
                    }

                    // Determine the directionality of the current UTF-8 character
                    $newState = self::$currentState;

                    while (true) {
                        if (I18N::scriptDirection(I18N::textScript($currentLetter)) === 'rtl') {
                            if (self::$currentState === '') {
                                $newState = 'RTL';
                                break;
                            }

                            if (self::$currentState === 'RTL') {
                                break;
                            }

                            // Switch to RTL only if this isn't a solitary RTL letter
                            $tempText = substr($workingText, $currentLen);
                            while ($tempText !== '') {
                                $nextCharArray = self::getChar($tempText, 0);
                                $nextLetter    = $nextCharArray['letter'];
                                $nextLen       = $nextCharArray['length'];
                                $tempText      = substr($tempText, $nextLen);

                                if (I18N::scriptDirection(I18N::textScript($nextLetter)) === 'rtl') {
                                    $newState = 'RTL';
                                    break 2;
                                }

                                if (str_contains(self::PUNCTUATION, $nextLetter) || str_contains(self::OPEN_PARENTHESES, $nextLetter)) {
                                    $newState = 'RTL';
                                    break 2;
                                }

                                if ($nextLetter === ' ') {
                                    break;
                                }
                                $nextLetter .= substr($tempText . "\n", 0, 5);
                                if ($nextLetter === '&nbsp;') {
                                    break;
                                }
                            }
                            // This is a solitary RTL letter : wrap it in UTF8 control codes to force LTR directionality
                            $currentLetter = self::UTF8_LRO . $currentLetter . self::UTF8_PDF;
                            $newState      = 'LTR';
                            break;
                        }
                        // NOTE(review): end of the rebuilt stretch; everything below was readable in the reviewed copy.
                        if ($currentLen !== 1 || $currentLetter >= 'A' && $currentLetter <= 'Z' || $currentLetter >= 'a' && $currentLetter <= 'z') {
                            // Since it’s neither Hebrew nor Arabic, this UTF-8 character or ASCII letter must be LTR
                            $newState = 'LTR';
                            break;
                        }
                        if ($closeParIndex !== false) {
                            // This closing parenthesis has to inherit the matching opening parenthesis' directionality
                            if (!empty($openParDirection[$closeParIndex]) && $openParDirection[$closeParIndex] !== '?') {
                                $newState = $openParDirection[$closeParIndex];
                            }
                            $openParDirection[$closeParIndex] = '';
                            break;
                        }
                        if ($openParIndex !== false) {
                            // Opening parentheses always inherit the following directionality
                            self::$waitingText .= $currentLetter;
                            $workingText       = substr($workingText, $currentLen);
                            while (true) {
                                if ($workingText === '') {
                                    break;
                                }
                                if (substr($workingText, 0, 1) === ' ') {
                                    // Spaces following this left parenthesis inherit the following directionality too
                                    self::$waitingText .= ' ';
                                    $workingText       = substr($workingText, 1);
                                    continue;
                                }
                                if (substr($workingText, 0, 6) === '&nbsp;') {
                                    // Spaces following this left parenthesis inherit the following directionality too
                                    self::$waitingText .= '&nbsp;';
                                    $workingText       = substr($workingText, 6);
                                    continue;
                                }
                                break;
                            }
                            $openParDirection[$openParIndex] = '?';
                            break 2; // double break because we're waiting for more information
                        }

                        // We have a digit or a "normal" special character.
                        //
                        // When this character is not at the start of the input string, it inherits the preceding directionality;
                        // at the start of the input string, it assumes the following directionality.
                        //
                        // Exceptions to this rule will be handled later during final clean-up.
                        //
                        self::$waitingText .= $currentLetter;
                        $workingText       = substr($workingText, $currentLen);
                        if (self::$currentState !== '') {
                            $result            .= self::$waitingText;
                            self::$waitingText = '';
                        }
                        break 2; // double break because we're waiting for more information
                    }
                    if ($newState !== self::$currentState) {
                        // A direction change has occurred
                        self::finishCurrentSpan($result);
                        self::$previousState = self::$currentState;
                        self::$currentState  = $newState;
                        self::beginCurrentSpan($result);
                    }
                    self::$waitingText .= $currentLetter;
                    $workingText       = substr($workingText, $currentLen);
                    $result            .= self::$waitingText;
                    self::$waitingText = '';

                    foreach ($openParDirection as $index => $value) {
                        // Since we now know the proper direction, remember it for all waiting opening parentheses
                        if ($value === '?') {
                            $openParDirection[$index] = self::$currentState;
                        }
                    }

                    break;
            }
        }

        // We're done. Finish last <span> if necessary
        if ($numberState) {
            if (self::$waitingText === '') {
                if (self::$currentState === 'RTL') {
                    $result .= self::UTF8_PDF;
                }
            } elseif (self::$currentState === 'RTL') {
                self::$waitingText .= self::UTF8_PDF;
            }
        }
        self::finishCurrentSpan($result, true);

        // Get rid of any waiting text
        if (self::$waitingText !== '') {
            if (I18N::direction() === 'rtl' && self::$currentState === 'LTR') {
                $result .= self::START_RTL;
                $result .= self::$waitingText;
                $result .= self::END_RTL;
            } else {
                $result .= self::START_LTR;
                $result .= self::$waitingText;
                $result .= self::END_LTR;
            }
            self::$waitingText = '';
        }

        // Lastly, do some more cleanups

        // Move leading RTL numeric strings to following LTR text
        // (this happens when the page direction is RTL and the original text begins with a number and is followed by LTR text)
        while (substr($result, 0, self::LENGTH_START + 3) === self::START_RTL . self::UTF8_LRE) {
            $spanEnd = strpos($result, self::END_RTL . self::START_LTR);
            if ($spanEnd === false) {
                break;
            }
            $textSpan = self::stripLrmRlm(substr($result, self::LENGTH_START + 3, $spanEnd - self::LENGTH_START - 3));
            if (I18N::scriptDirection(I18N::textScript($textSpan)) === 'rtl') {
                break;
            }
            $result = self::START_LTR . substr($result, self::LENGTH_START, $spanEnd - self::LENGTH_START) . substr($result, $spanEnd + self::LENGTH_START + self::LENGTH_END);
            break;
        }

        // On RTL pages, put trailing "." in RTL numeric strings into its own RTL span
        if (I18N::direction() === 'rtl') {
            $result = str_replace(self::UTF8_PDF . '.' . self::END_RTL, self::UTF8_PDF . self::END_RTL . self::START_RTL . '.' . self::END_RTL, $result);
        }

        // Trim trailing blanks preceding <br> in LTR text
        while (self::$previousState !== 'RTL') {
            if (str_contains($result, ' <LTRbr>')) {
                $result = str_replace(' <LTRbr>', '<LTRbr>', $result);
                continue;
            }
            if (str_contains($result, '&nbsp;<LTRbr>')) {
                $result = str_replace('&nbsp;<LTRbr>', '<LTRbr>', $result);
                continue;
            }
            if (str_contains($result, ' <br>')) {
                $result = str_replace(' <br>', '<br>', $result);
                continue;
            }
            if (str_contains($result, '&nbsp;<br>')) {
                $result = str_replace('&nbsp;<br>', '<br>', $result);
                continue;
            }
            break; // Neither space nor &nbsp; : we're done
        }

        // Trim trailing blanks preceding <br> in RTL text
        while (true) {
            if (str_contains($result, ' <RTLbr>')) {
                $result = str_replace(' <RTLbr>', '<RTLbr>', $result);
                continue;
            }
            if (str_contains($result, '&nbsp;<RTLbr>')) {
                $result = str_replace('&nbsp;<RTLbr>', '<RTLbr>', $result);
                continue;
            }
            break; // Neither space nor &nbsp; : we're done
        }

        // Convert '<LTRbr>' and '<RTLbr>'
        $result = str_replace([
            '<LTRbr>',
            '<RTLbr>',
        ], [
            self::END_LTR . '<br>' . self::START_LTR,
            self::END_RTL . '<br>' . self::START_RTL,
        ], $result);

        // Include leading indeterminate directional text in whatever follows
        if (substr($result . "\n", 0, self::LENGTH_START) !== self::START_LTR && substr($result . "\n", 0, self::LENGTH_START) !== self::START_RTL && substr($result . "\n", 0, 4) !== '<br>') {
            $leadingText = '';
            while (true) {
                if ($result === '') {
                    $result = $leadingText;
                    break;
                }
                if (substr($result . "\n", 0, self::LENGTH_START) !== self::START_LTR && substr($result . "\n", 0, self::LENGTH_START) !== self::START_RTL) {
                    $leadingText .= substr($result, 0, 1);
                    $result      = substr($result, 1);
                    continue;
                }
                $result = substr($result, 0, self::LENGTH_START) . $leadingText . substr($result, self::LENGTH_START);
                break;
            }
        }

        // Include solitary "-" and "+" in surrounding RTL text
        $result = str_replace([
            self::END_RTL . self::START_LTR . '-' . self::END_LTR . self::START_RTL,
            self::END_RTL . self::START_LTR . '+' . self::END_LTR . self::START_RTL,
        ], [
            '-',
            '+',
        ], $result);

        // Remove empty spans
        $result = str_replace([
            self::START_LTR . self::END_LTR,
            self::START_RTL . self::END_RTL,
        ], '', $result);

        // Finally, correct '<LTR>', '</LTR>', '<RTL>', and '</RTL>'
        // LTR text: <span dir="ltr"> text </span>
        // RTL text: <span dir="rtl"> text </span>
        $result = str_replace([
            self::START_LTR,
            self::END_LTR,
            self::START_RTL,
            self::END_RTL,
        ], [
            '<span dir="ltr">',
            '</span>',
            '<span dir="rtl">',
            '</span>',
        ], $result);

        return $result;
    }

    /**
     * Wrap words that have an asterisk suffix in <u> and </u> tags.
     * This should underline starred names to show the preferred name.
     *
     * @param string $textSpan  The text of one directional run
     * @param string $direction Direction of that run: 'LTR' or 'RTL'
     *
     * @return string
     */
    private static function starredName(string $textSpan, string $direction): string
    {
        // To avoid a TCPDF bug that mixes up the word order, insert those <u> and </u> tags
        // only when page and span directions are identical.
        if ($direction === strtoupper(I18N::direction())) {
            while (true) {
                $starPos = strpos($textSpan, '*');
                if ($starPos === false) {
                    break;
                }
                $trailingText = substr($textSpan, $starPos + 1);
                $textSpan     = substr($textSpan, 0, $starPos);
                $wordStart    = strrpos($textSpan, ' '); // Find the start of the word
                if ($wordStart !== false) {
                    $leadingText = substr($textSpan, 0, $wordStart + 1);
                    $wordText    = substr($textSpan, $wordStart + 1);
                } else {
                    $leadingText = '';
                    $wordText    = $textSpan;
                }
                $textSpan = $leadingText . '<u>' . $wordText . '</u>' . $trailingText;
            }
            $textSpan = preg_replace('~<span class="starredname">(.*)</span>~', '<u>\1</u>', $textSpan);
            // The &nbsp; is a work-around for a TCPDF bug eating blanks.
            $textSpan = str_replace([
                ' <u>',
                '</u> ',
            ], [
                '&nbsp;<u>',
                '</u>&nbsp;',
            ], $textSpan);
        } else {
            // Text and page directions differ: remove the <span> and </span>
            $textSpan = preg_replace('~(.*)\*~', '\1', $textSpan);
            $textSpan = preg_replace('~<span class="starredname">(.*)</span>~', '\1', $textSpan);
        }

        return $textSpan;
    }

    /**
     * Get the next character from an input string
     *
     * The byte at $offset is treated as the lead byte of a UTF-8 sequence; its high bits decide
     * whether 1, 2, 3 or 4 bytes are returned. An empty $text yields an empty letter of length 0.
     *
     * @param string $text
     * @param int    $offset Byte offset of the character's first byte
     *
     * @return array{'letter':string,'length':int}
     */
    private static function getChar(string $text, int $offset): array
    {
        if ($text === '') {
            return [
                'letter' => '',
                'length' => 0,
            ];
        }

        $char   = substr($text, $offset, 1);
        $length = 1;
        if ((ord($char) & 0xE0) === 0xC0) {
            $length = 2;
        }
        if ((ord($char) & 0xF0) === 0xE0) {
            $length = 3;
        }
        if ((ord($char) & 0xF8) === 0xF0) {
            $length = 4;
        }
        $letter = substr($text, $offset, $length);

        return [
            'letter' => $letter,
            'length' => $length,
        ];
    }

    /**
     * Insert <br> into current span
     *
     * Any waiting text is flushed first; the break itself is written as '<LTRbr>' or '<RTLbr>'
     * (depending on the current state) and converted to a real <br> later by spanLtrRtl().
     *
     * @param string $result Output built so far; modified in place
     *
     * @return void
     */
    private static function breakCurrentSpan(string &$result): void
    {
        // Interrupt the current span, insert that <br>, and then continue the current span
        $result            .= self::$waitingText;
        self::$waitingText = '';

        $breakString = '<' . self::$currentState . 'br>';
        $result      .= $breakString;
    }

    /**
     * Begin current span
     *
     * Appends the start marker for the current state (nothing when the state is neither 'LTR'
     * nor 'RTL') and remembers where the text of the new span starts.
     *
     * @param string $result Output built so far; modified in place
     *
     * @return void
     */
    private static function beginCurrentSpan(string &$result): void
    {
        if (self::$currentState === 'LTR') {
            $result .= self::START_LTR;
        }
        if (self::$currentState === 'RTL') {
            $result .= self::START_RTL;
        }

        self::$posSpanStart = strlen($result);
    }

    /**
     * Finish current span
     *
     * Takes the text written since beginCurrentSpan(), isolates time-like numeric strings, moves
     * trailing numbers, blanks, breaks, punctuation, ID numbers and " - " separators into their
     * own span or into the waiting text of the following span, and appends the end marker.
     *
     * @param string $result Output built so far; modified in place
     * @param bool   $theEnd True when this is the final span of the input
     *
     * @return void
     */
    private static function finishCurrentSpan(string &$result, bool $theEnd = false): void
    {
        $textSpan = substr($result, self::$posSpanStart);
        $result   = substr($result, 0, self::$posSpanStart);

        // Get rid of empty spans, so that our check for presence of RTL will work
        $result = str_replace([
            self::START_LTR . self::END_LTR,
            self::START_RTL . self::END_RTL,
        ], '', $result);

        // Look for numeric strings that are times (hh:mm:ss). These have to be separated from surrounding numbers.
        $tempResult = '';
        while ($textSpan !== '') {
            $posColon = strpos($textSpan, ':');
            if ($posColon === false) {
                break;
            } // No more possible time strings
            $posLRE = strpos($textSpan, self::UTF8_LRE);
            if ($posLRE === false) {
                break;
            } // No more numeric strings
            $posPDF = strpos($textSpan, self::UTF8_PDF, $posLRE);
            if ($posPDF === false) {
                break;
            } // No more numeric strings

            $tempResult    .= substr($textSpan, 0, $posLRE + 3); // Copy everything preceding the numeric string
            $numericString = substr($textSpan, $posLRE + 3, $posPDF - $posLRE); // Separate the entire numeric string
            $textSpan      = substr($textSpan, $posPDF + 3);
            $posColon      = strpos($numericString, ':');
            if ($posColon === false) {
                // Nothing that looks like a time here
                $tempResult .= $numericString;
                continue;
            }
            // Appending the separator guarantees that both searches succeed
            $posBlank = strpos($numericString . ' ', ' ');
            $posNbsp  = strpos($numericString . '&nbsp;', '&nbsp;');
            if ($posBlank < $posNbsp) {
                $posSeparator    = $posBlank;
                $lengthSeparator = 1;
            } else {
                $posSeparator    = $posNbsp;
                $lengthSeparator = 6;
            }
            if ($posColon > $posSeparator) {
                // We have a time string preceded by a blank: Exclude that blank from the numeric string
                $tempResult    .= substr($numericString, 0, $posSeparator);
                $tempResult    .= self::UTF8_PDF;
                $tempResult    .= substr($numericString, $posSeparator, $lengthSeparator);
                $tempResult    .= self::UTF8_LRE;
                $numericString = substr($numericString, $posSeparator + $lengthSeparator);
            }

            $posBlank = strpos($numericString, ' ');
            $posNbsp  = strpos($numericString, '&nbsp;');
            if ($posBlank === false && $posNbsp === false) {
                // The time string isn't followed by a blank
                $textSpan = $numericString . $textSpan;
                continue;
            }

            // We have a time string followed by a blank: Exclude that blank from the numeric string
            if ($posBlank === false) {
                $posSeparator    = $posNbsp;
                $lengthSeparator = 6;
            } elseif ($posNbsp === false) {
                $posSeparator    = $posBlank;
                $lengthSeparator = 1;
            } elseif ($posBlank < $posNbsp) {
                $posSeparator    = $posBlank;
                $lengthSeparator = 1;
            } else {
                $posSeparator    = $posNbsp;
                $lengthSeparator = 6;
            }
            $tempResult    .= substr($numericString, 0, $posSeparator);
            $tempResult    .= self::UTF8_PDF;
            $tempResult    .= substr($numericString, $posSeparator, $lengthSeparator);
            $posSeparator  += $lengthSeparator;
            $numericString = substr($numericString, $posSeparator);
            $textSpan      = self::UTF8_LRE . $numericString . $textSpan;
        }
        $textSpan       = $tempResult . $textSpan;
        $trailingBlanks = '';
        $trailingBreaks = '';

        /* ****************************** LTR text handling ******************************** */

        if (self::$currentState === 'LTR') {
            // Move trailing numeric strings to the following RTL text. Include any blanks preceding or following the numeric text too.
            if (I18N::direction() === 'rtl' && self::$previousState === 'RTL' && !$theEnd) {
                $trailingString = '';
                $savedSpan      = $textSpan;
                while ($textSpan !== '') {
                    // Look for trailing spaces and tentatively move them
                    if (substr($textSpan, -1) === ' ') {
                        $trailingString = ' ' . $trailingString;
                        $textSpan       = substr($textSpan, 0, -1);
                        continue;
                    }
                    if (substr($textSpan, -6) === '&nbsp;') {
                        $trailingString = '&nbsp;' . $trailingString;
                        $textSpan       = substr($textSpan, 0, -6); // Remove the whole 6-byte entity, not just its ';'
                        continue;
                    }
                    if (substr($textSpan, -3) !== self::UTF8_PDF) {
                        // There is no trailing numeric string
                        $textSpan = $savedSpan;
                        break;
                    }

                    // We have a numeric string
                    $posStartNumber = strrpos($textSpan, self::UTF8_LRE);
                    if ($posStartNumber === false) {
                        $posStartNumber = 0;
                    }
                    $trailingString = substr($textSpan, $posStartNumber) . $trailingString;
                    $textSpan       = substr($textSpan, 0, $posStartNumber);

                    // Look for more spaces and move them too
                    while ($textSpan !== '') {
                        if (substr($textSpan, -1) === ' ') {
                            $trailingString = ' ' . $trailingString;
                            $textSpan       = substr($textSpan, 0, -1);
                            continue;
                        }
                        if (substr($textSpan, -6) === '&nbsp;') {
                            $trailingString = '&nbsp;' . $trailingString;
                            $textSpan       = substr($textSpan, 0, -6); // Remove the whole 6-byte entity
                            continue;
                        }
                        break;
                    }

                    self::$waitingText = $trailingString . self::$waitingText;
                    break;
                }
            }

            $savedSpan = $textSpan;
            // Move any trailing <br>, optionally preceded or followed by blanks, outside this LTR span
            while ($textSpan !== '') {
                if (substr($textSpan, -1) === ' ') {
                    $trailingBlanks = ' ' . $trailingBlanks;
                    $textSpan       = substr($textSpan, 0, -1);
                    continue;
                }
                if (substr('......' . $textSpan, -6) === '&nbsp;') {
                    $trailingBlanks = '&nbsp;' . $trailingBlanks;
                    $textSpan       = substr($textSpan, 0, -6);
                    continue;
                }
                break;
            }
            while (substr($textSpan, -self::LENGTH_BREAK) === '<LTRbr>') {
                $trailingBreaks = '<br>' . $trailingBreaks; // Plain <br> because it’s outside a span
                $textSpan       = substr($textSpan, 0, -self::LENGTH_BREAK);
            }
            if ($trailingBreaks !== '') {
                while ($textSpan !== '') {
                    if (substr($textSpan, -1) === ' ') {
                        $trailingBreaks = ' ' . $trailingBreaks;
                        $textSpan       = substr($textSpan, 0, -1);
                        continue;
                    }
                    if (substr($textSpan, -6) === '&nbsp;') {
                        $trailingBreaks = '&nbsp;' . $trailingBreaks;
                        $textSpan       = substr($textSpan, 0, -6);
                        continue;
                    }
                    break;
                }
                self::$waitingText = $trailingBlanks . self::$waitingText; // Put those trailing blanks inside the following span
            } else {
                $textSpan = $savedSpan;
            }

            $trailingBlanks      = '';
            $trailingPunctuation = '';
            $trailingID          = '';
            $trailingSeparator   = '';
            $leadingSeparator    = '';

            // This "loop" runs at most once (it always ends in a break); it is only entered on RTL pages
            while (I18N::direction() === 'rtl') {
                if (str_contains($result, self::START_RTL)) {
                    // Remove trailing blanks for inclusion in a separate LTR span
                    while ($textSpan !== '') {
                        if (substr($textSpan, -1) === ' ') {
                            $trailingBlanks = ' ' . $trailingBlanks;
                            $textSpan       = substr($textSpan, 0, -1);
                            continue;
                        }
                        if (substr($textSpan, -6) === '&nbsp;') {
                            $trailingBlanks = '&nbsp;' . $trailingBlanks;
                            $textSpan       = substr($textSpan, 0, -6); // Remove the whole 6-byte entity
                            continue;
                        }
                        break;
                    }

                    // Remove trailing punctuation for inclusion in a separate LTR span
                    if ($textSpan === '') {
                        $trailingChar = "\n";
                    } else {
                        $trailingChar = substr($textSpan, -1);
                    }
                    if (str_contains(self::PUNCTUATION, $trailingChar)) {
                        $trailingPunctuation = $trailingChar;
                        $textSpan            = substr($textSpan, 0, -1);
                    }
                }

                // Remove trailing ID numbers that look like "(xnnn)" for inclusion in a separate LTR span
                while (true) {
                    if (substr($textSpan, -1) !== ')') {
                        break;
                    } // There is no trailing ')'
                    $posLeftParen = strrpos($textSpan, '(');
                    if ($posLeftParen === false) {
                        break;
                    } // There is no leading '('
                    $temp = self::stripLrmRlm(substr($textSpan, $posLeftParen)); // Get rid of UTF8 control codes

                    // If the parenthesized text doesn't look like an ID number,
                    // we don't want to touch it.
                    // This check won’t work if somebody uses ID numbers with an unusual format.
                    $offset    = 1;
                    $charArray = self::getChar($temp, $offset); // Get 1st character of parenthesized text
                    if (str_contains(self::NUMBERS, $charArray['letter'])) {
                        break;
                    }
                    $offset += $charArray['length']; // Point at 2nd character of parenthesized text
                    if (!str_contains(self::NUMBERS, substr($temp, $offset, 1))) {
                        break;
                    }
                    // 1st character of parenthesized text is alpha, 2nd character is a digit; last has to be a digit too
                    if (!str_contains(self::NUMBERS, substr($temp, -2, 1))) {
                        break;
                    }

                    $trailingID = substr($textSpan, $posLeftParen);
                    $textSpan   = substr($textSpan, 0, $posLeftParen);
                    break;
                }

                // Look for " - " or blank preceding the ID number and remove it for inclusion in a separate LTR span
                if ($trailingID !== '') {
                    while ($textSpan !== '') {
                        if (substr($textSpan, -1) === ' ') {
                            $trailingSeparator = ' ' . $trailingSeparator;
                            $textSpan          = substr($textSpan, 0, -1);
                            continue;
                        }
                        if (substr($textSpan, -6) === '&nbsp;') {
                            $trailingSeparator = '&nbsp;' . $trailingSeparator;
                            $textSpan          = substr($textSpan, 0, -6);
                            continue;
                        }
                        if (substr($textSpan, -1) === '-') {
                            $trailingSeparator = '-' . $trailingSeparator;
                            $textSpan          = substr($textSpan, 0, -1);
                            continue;
                        }
                        break;
                    }
                }

                // Look for " - " preceding the text and remove it for inclusion in a separate LTR span
                $foundSeparator = false;
                $savedSpan      = $textSpan;
                while ($textSpan !== '') {
                    if (substr($textSpan, 0, 1) === ' ') {
                        $leadingSeparator = ' ' . $leadingSeparator;
                        $textSpan         = substr($textSpan, 1);
                        continue;
                    }
                    if (substr($textSpan, 0, 6) === '&nbsp;') {
                        $leadingSeparator = '&nbsp;' . $leadingSeparator;
                        $textSpan         = substr($textSpan, 6);
                        continue;
                    }
                    if (substr($textSpan, 0, 1) === '-') {
                        $leadingSeparator = '-' . $leadingSeparator;
                        $textSpan         = substr($textSpan, 1);
                        $foundSeparator   = true;
                        continue;
                    }
                    break;
                }
                if (!$foundSeparator) {
                    $textSpan         = $savedSpan;
                    $leadingSeparator = '';
                }
                break;
            }

            // We're done: finish the span
            $textSpan = self::starredName($textSpan, 'LTR'); // Wrap starred name in <u> and </u> tags
            while (true) {
                // Remove blanks that precede <LTRbr>
                if (str_contains($textSpan, ' <LTRbr>')) {
                    $textSpan = str_replace(' <LTRbr>', '<LTRbr>', $textSpan);
                    continue;
                }
                if (str_contains($textSpan, '&nbsp;<LTRbr>')) {
                    $textSpan = str_replace('&nbsp;<LTRbr>', '<LTRbr>', $textSpan);
                    continue;
                }
                break;
            }
            if ($leadingSeparator !== '') {
                $result .= self::START_LTR . $leadingSeparator . self::END_LTR;
            }
            $result .= $textSpan . self::END_LTR;
            if ($trailingSeparator !== '') {
                $result .= self::START_LTR . $trailingSeparator . self::END_LTR;
            }
            if ($trailingID !== '') {
                $result .= self::START_LTR . $trailingID . self::END_LTR;
            }
            if ($trailingPunctuation !== '') {
                $result .= self::START_LTR . $trailingPunctuation . self::END_LTR;
            }
            if ($trailingBlanks !== '') {
                $result .= self::START_LTR . $trailingBlanks . self::END_LTR;
            }
        }

        /* ****************************** RTL text handling ******************************** */

        if (self::$currentState === 'RTL') {
            $savedSpan = $textSpan;

            // Move any trailing <br>, optionally followed by blanks, outside this RTL span
            while ($textSpan !== '') {
                if (substr($textSpan, -1) === ' ') {
                    $trailingBlanks = ' ' . $trailingBlanks;
                    $textSpan       = substr($textSpan, 0, -1);
                    continue;
                }
                if (substr('......' . $textSpan, -6) === '&nbsp;') {
                    $trailingBlanks = '&nbsp;' . $trailingBlanks;
                    $textSpan       = substr($textSpan, 0, -6);
                    continue;
                }
                break;
            }
            while (substr($textSpan, -self::LENGTH_BREAK) === '<RTLbr>') {
                $trailingBreaks = '<br>' . $trailingBreaks; // Plain <br> because it’s outside a span
                $textSpan       = substr($textSpan, 0, -self::LENGTH_BREAK);
            }
            if ($trailingBreaks !== '') {
                self::$waitingText = $trailingBlanks . self::$waitingText; // Put those trailing blanks inside the following span
            } else {
                $textSpan = $savedSpan;
            }

            // Move trailing numeric strings to the following LTR text. Include any blanks preceding or following the numeric text too.
            if (!$theEnd && I18N::direction() !== 'rtl') {
                $trailingString = '';
                $savedSpan      = $textSpan;
                while ($textSpan !== '') {
                    // Look for trailing spaces and tentatively move them
                    if (substr($textSpan, -1) === ' ') {
                        $trailingString = ' ' . $trailingString;
                        $textSpan       = substr($textSpan, 0, -1);
                        continue;
                    }
                    if (substr($textSpan, -6) === '&nbsp;') {
                        $trailingString = '&nbsp;' . $trailingString;
                        $textSpan       = substr($textSpan, 0, -6); // Remove the whole 6-byte entity
                        continue;
                    }
                    if (substr($textSpan, -3) !== self::UTF8_PDF) {
                        // There is no trailing numeric string
                        $textSpan = $savedSpan;
                        break;
                    }

                    // We have a numeric string
                    $posStartNumber = strrpos($textSpan, self::UTF8_LRE);
                    if ($posStartNumber === false) {
                        $posStartNumber = 0;
                    }
                    $trailingString = substr($textSpan, $posStartNumber) . $trailingString;
                    $textSpan       = substr($textSpan, 0, $posStartNumber);

                    // Look for more spaces and move them too
                    while ($textSpan !== '') {
                        if (substr($textSpan, -1) === ' ') {
                            $trailingString = ' ' . $trailingString;
                            $textSpan       = substr($textSpan, 0, -1);
                            continue;
                        }
                        if (substr($textSpan, -6) === '&nbsp;') {
                            $trailingString = '&nbsp;' . $trailingString;
                            $textSpan       = substr($textSpan, 0, -6); // Remove the whole 6-byte entity
                            continue;
                        }
                        break;
                    }

                    self::$waitingText = $trailingString . self::$waitingText;
                    break;
                }
            }

            // Trailing " - " needs to be prefixed to the following span
            if (!$theEnd && substr('...' . $textSpan, -3) === ' - ') {
                $textSpan          = substr($textSpan, 0, -3);
                self::$waitingText = ' - ' . self::$waitingText;
            }

            while (I18N::direction() === 'rtl') {
                // Look for " - " preceding <RTLbr> and relocate it to the front of the string
                $posDashString = strpos($textSpan, ' - <RTLbr>');
                if ($posDashString === false) {
                    break;
                }
                $posStringStart = strrpos(substr($textSpan, 0, $posDashString), '<RTLbr>');
                if ($posStringStart === false) {
                    $posStringStart = 0;
                } else {
                    $posStringStart += self::LENGTH_BREAK;
                } // Point to the first char following the last <RTLbr>

                $textSpan = substr($textSpan, 0, $posStringStart) . ' - ' . substr($textSpan, $posStringStart, $posDashString - $posStringStart) . substr($textSpan, $posDashString + 3);
            }

            // Strip leading spaces from the RTL text
            $countLeadingSpaces = 0;
            while ($textSpan !== '') {
                if (substr($textSpan, 0, 1) === ' ') {
                    $countLeadingSpaces++;
                    $textSpan = substr($textSpan, 1);
                    continue;
                }
                if (substr($textSpan, 0, 6) === '&nbsp;') {
                    $countLeadingSpaces++;
                    $textSpan = substr($textSpan, 6);
                    continue;
                }
                break;
            }

            // Strip trailing spaces from the RTL text
            $countTrailingSpaces = 0;
            while ($textSpan !== '') {
                if (substr($textSpan, -1) === ' ') {
                    $countTrailingSpaces++;
                    $textSpan = substr($textSpan, 0, -1);
                    continue;
                }
                if (substr($textSpan, -6) === '&nbsp;') {
                    $countTrailingSpaces++;
                    $textSpan = substr($textSpan, 0, -6);
                    continue;
                }
                break;
            }

            // Look for trailing " -", reverse it, and relocate it to the front of the string
            if (substr($textSpan, -2) === ' -') {
                $posDashString  = strlen($textSpan) - 2;
                $posStringStart = strrpos(substr($textSpan, 0, $posDashString), '<RTLbr>');
                if ($posStringStart === false) {
                    $posStringStart = 0;
                } else {
                    $posStringStart += self::LENGTH_BREAK;
                } // Point to the first char following the last <RTLbr>

                $textSpan = substr($textSpan, 0, $posStringStart) . '- ' . substr($textSpan, $posStringStart, $posDashString - $posStringStart) . substr($textSpan, $posDashString + 2);
            }

            if ($countLeadingSpaces !== 0) {
                $newLength = strlen($textSpan) + $countLeadingSpaces;
                $textSpan  = str_pad($textSpan, $newLength, ' ', I18N::direction() === 'rtl' ? STR_PAD_LEFT : STR_PAD_RIGHT);
            }
            if ($countTrailingSpaces !== 0) {
                if (I18N::direction() === 'ltr') {
                    if ($trailingBreaks === '') {
                        // Move trailing RTL spaces to front of following LTR span
                        $newLength         = strlen(self::$waitingText) + $countTrailingSpaces;
                        self::$waitingText = str_pad(self::$waitingText, $newLength, ' ', STR_PAD_LEFT);
                    }
                } else {
                    $newLength = strlen($textSpan) + $countTrailingSpaces;
                    $textSpan  = str_pad($textSpan, $newLength);
                }
            }

            // We're done: finish the span
            $textSpan = self::starredName($textSpan, 'RTL'); // Wrap starred name in <u> and </u> tags
            $result   .= $textSpan . self::END_RTL;
        }

        if (self::$currentState !== 'LTR' && self::$currentState !== 'RTL') {
            $result .= $textSpan;
        }

        $result .= $trailingBreaks; // Get rid of any waiting <br>
    }
}