layout/generic/nsTextRunTransformations.cpp

   1 /* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*-
   2  * This Source Code Form is subject to the terms of the Mozilla Public
   3  * License, v. 2.0. If a copy of the MPL was not distributed with this
   4  * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
   5
   6 #include "nsTextRunTransformations.h"
   7
   8 #include "mozilla/MemoryReporting.h"
   9
  10 #include "nsGkAtoms.h"
  11 #include "nsStyleConsts.h"
  12 #include "nsStyleContext.h"
  13 #include "nsUnicharUtils.h"
  14 #include "nsUnicodeProperties.h"
  15 #include "nsSpecialCasingData.h"
  16 #include "mozilla/gfx/2D.h"
  17 #include "nsTextFrameUtils.h"
  18 #include "nsIPersistentProperties2.h"
  19 #include "nsNetUtil.h"
  20 #include "GreekCasing.h"
  21 #include "IrishCasing.h"
  22
  23 // Unicode characters needing special casing treatment in tr/az languages
  24 #define LATIN_CAPITAL_LETTER_I_WITH_DOT_ABOVE  0x0130
  25 #define LATIN_SMALL_LETTER_DOTLESS_I           0x0131
  26
  27 // Greek sigma needs custom handling for the lowercase transform; for details
  28 // see comments under "case NS_STYLE_TEXT_TRANSFORM_LOWERCASE" within
  29 // nsCaseTransformTextRunFactory::RebuildTextRun(), and bug 740120.
  30 #define GREEK_CAPITAL_LETTER_SIGMA             0x03A3
  31 #define GREEK_SMALL_LETTER_FINAL_SIGMA         0x03C2
  32 #define GREEK_SMALL_LETTER_SIGMA               0x03C3
  33
  34 nsTransformedTextRun *
  35 nsTransformedTextRun::Create(const gfxTextRunFactory::Parameters* aParams,
  36                              nsTransformingTextRunFactory* aFactory,
  37                              gfxFontGroup* aFontGroup,
  38                              const char16_t* aString, uint32_t aLength,
  39                              const uint32_t aFlags, nsStyleContext** aStyles,
  40                              bool aOwnsFactory)
  41 {
  42   NS_ASSERTION(!(aFlags & gfxTextRunFactory::TEXT_IS_8BIT),
  43                "didn't expect text to be marked as 8-bit here");
  44
  45   void *storage = AllocateStorageForTextRun(sizeof(nsTransformedTextRun), aLength);
  46   if (!storage) {
  47     return nullptr;
  48   }
  49
  50   return new (storage) nsTransformedTextRun(aParams, aFactory, aFontGroup,
  51                                             aString, aLength,
  52                                             aFlags, aStyles, aOwnsFactory);
  53 }
  54
  55 void
  56 nsTransformedTextRun::SetCapitalization(uint32_t aStart, uint32_t aLength,
  57                                         bool* aCapitalization,
  58                                         gfxContext* aRefContext)
  59 {
  60   if (mCapitalize.IsEmpty()) {
  61     if (!mCapitalize.AppendElements(GetLength()))
  62       return;
  63     memset(mCapitalize.Elements(), 0, GetLength()*sizeof(bool));
  64   }
  65   memcpy(mCapitalize.Elements() + aStart, aCapitalization, aLength*sizeof(bool));
  66   mNeedsRebuild = true;
  67 }
  68
  69 bool
  70 nsTransformedTextRun::SetPotentialLineBreaks(uint32_t aStart, uint32_t aLength,
  71                                              uint8_t* aBreakBefore,
  72                                              gfxContext* aRefContext)
  73 {
  74   bool changed = gfxTextRun::SetPotentialLineBreaks(aStart, aLength,
  75       aBreakBefore, aRefContext);
  76   if (changed) {
  77     mNeedsRebuild = true;
  78   }
  79   return changed;
  80 }
  81
  82 size_t
  83 nsTransformedTextRun::SizeOfExcludingThis(mozilla::MallocSizeOf aMallocSizeOf)
  84 {
  85   size_t total = gfxTextRun::SizeOfExcludingThis(aMallocSizeOf);
  86   total += mStyles.SizeOfExcludingThis(aMallocSizeOf);
  87   total += mCapitalize.SizeOfExcludingThis(aMallocSizeOf);
  88   if (mOwnsFactory) {
  89     total += aMallocSizeOf(mFactory);
  90   }
  91   return total;
  92 }
  93
  94 size_t
  95 nsTransformedTextRun::SizeOfIncludingThis(mozilla::MallocSizeOf aMallocSizeOf)
  96 {
  97   return aMallocSizeOf(this) + SizeOfExcludingThis(aMallocSizeOf);
  98 }
  99
 100 nsTransformedTextRun*
 101 nsTransformingTextRunFactory::MakeTextRun(const char16_t* aString, uint32_t aLength,
 102                                           const gfxTextRunFactory::Parameters* aParams,
 103                                           gfxFontGroup* aFontGroup, uint32_t aFlags,
 104                                           nsStyleContext** aStyles, bool aOwnsFactory)
 105 {
 106   return nsTransformedTextRun::Create(aParams, this, aFontGroup,
 107                                       aString, aLength, aFlags, aStyles, aOwnsFactory);
 108 }
 109
 110 nsTransformedTextRun*
 111 nsTransformingTextRunFactory::MakeTextRun(const uint8_t* aString, uint32_t aLength,
 112                                           const gfxTextRunFactory::Parameters* aParams,
 113                                           gfxFontGroup* aFontGroup, uint32_t aFlags,
 114                                           nsStyleContext** aStyles, bool aOwnsFactory)
 115 {
 116   // We'll only have a Unicode code path to minimize the amount of code needed
 117   // for these rarely used features
 118   NS_ConvertASCIItoUTF16 unicodeString(reinterpret_cast<const char*>(aString), aLength);
 119   return MakeTextRun(unicodeString.get(), aLength, aParams, aFontGroup,
 120                      aFlags & ~(gfxFontGroup::TEXT_IS_PERSISTENT | gfxFontGroup::TEXT_IS_8BIT),
 121                      aStyles, aOwnsFactory);
 122 }
 123
 124 void
 125 MergeCharactersInTextRun(gfxTextRun* aDest, gfxTextRun* aSrc,
 126                          const bool* aCharsToMerge, const bool* aDeletedChars)
 127 {
 128   aDest->ResetGlyphRuns();
 129
 130   gfxTextRun::GlyphRunIterator iter(aSrc, 0, aSrc->GetLength());
 131   uint32_t offset = 0;
 132   nsAutoTArray<gfxTextRun::DetailedGlyph,2> glyphs;
 133   while (iter.NextRun()) {
 134     gfxTextRun::GlyphRun* run = iter.GetGlyphRun();
 135     nsresult rv = aDest->AddGlyphRun(run->mFont, run->mMatchType,
 136                                      offset, false);
 137     if (NS_FAILED(rv))
 138       return;
 139
 140     bool anyMissing = false;
 141     uint32_t mergeRunStart = iter.GetStringStart();
 142     const gfxTextRun::CompressedGlyph *srcGlyphs = aSrc->GetCharacterGlyphs();
 143     gfxTextRun::CompressedGlyph mergedGlyph = srcGlyphs[mergeRunStart];
 144     uint32_t stringEnd = iter.GetStringEnd();
 145     for (uint32_t k = iter.GetStringStart(); k < stringEnd; ++k) {
 146       const gfxTextRun::CompressedGlyph g = srcGlyphs[k];
 147       if (g.IsSimpleGlyph()) {
 148         if (!anyMissing) {
 149           gfxTextRun::DetailedGlyph details;
 150           details.mGlyphID = g.GetSimpleGlyph();
 151           details.mAdvance = g.GetSimpleAdvance();
 152           details.mXOffset = 0;
 153           details.mYOffset = 0;
 154           glyphs.AppendElement(details);
 155         }
 156       } else {
 157         if (g.IsMissing()) {
 158           anyMissing = true;
 159           glyphs.Clear();
 160         }
 161         if (g.GetGlyphCount() > 0) {
 162           glyphs.AppendElements(aSrc->GetDetailedGlyphs(k), g.GetGlyphCount());
 163         }
 164       }
 165
 166       if (k + 1 < iter.GetStringEnd() && aCharsToMerge[k + 1]) {
 167         // next char is supposed to merge with current, so loop without
 168         // writing current merged glyph to the destination
 169         continue;
 170       }
 171
 172       // If the start of the merge run is actually a character that should
 173       // have been merged with the previous character (this can happen
 174       // if there's a font change in the middle of a case-mapped character,
 175       // that decomposed into a sequence of base+diacritics, for example),
 176       // just discard the entire merge run. See comment at start of this
 177       // function.
 178       NS_WARN_IF_FALSE(!aCharsToMerge[mergeRunStart],
 179                        "unable to merge across a glyph run boundary, "
 180                        "glyph(s) discarded");
 181       if (!aCharsToMerge[mergeRunStart]) {
 182         if (anyMissing) {
 183           mergedGlyph.SetMissing(glyphs.Length());
 184         } else {
 185           mergedGlyph.SetComplex(mergedGlyph.IsClusterStart(),
 186                                  mergedGlyph.IsLigatureGroupStart(),
 187                                  glyphs.Length());
 188         }
 189         aDest->SetGlyphs(offset, mergedGlyph, glyphs.Elements());
 190         ++offset;
 191
 192         while (offset < aDest->GetLength() && aDeletedChars[offset]) {
 193           aDest->SetGlyphs(offset++, gfxTextRun::CompressedGlyph(), nullptr);
 194         }
 195       }
 196
 197       glyphs.Clear();
 198       anyMissing = false;
 199       mergeRunStart = k + 1;
 200       if (mergeRunStart < stringEnd) {
 201         mergedGlyph = srcGlyphs[mergeRunStart];
 202       }
 203     }
 204     NS_ASSERTION(glyphs.Length() == 0,
 205                  "Leftover glyphs, don't request merging of the last character with its next!");
 206   }
 207   NS_ASSERTION(offset == aDest->GetLength(), "Bad offset calculations");
 208 }
 209
 210 gfxTextRunFactory::Parameters
 211 GetParametersForInner(nsTransformedTextRun* aTextRun, uint32_t* aFlags,
 212     gfxContext* aRefContext)
 213 {
 214   gfxTextRunFactory::Parameters params =
 215     { aRefContext, nullptr, nullptr,
 216       nullptr, 0, aTextRun->GetAppUnitsPerDevUnit()
 217     };
 218   *aFlags = aTextRun->GetFlags() & ~gfxFontGroup::TEXT_IS_PERSISTENT;
 219   return params;
 220 }
 221
 222 // Some languages have special casing conventions that differ from the
 223 // default Unicode mappings.
 224 // The enum values here are named for well-known exemplar languages that
 225 // exhibit the behavior in question; multiple lang tags may map to the
 226 // same setting here, if the behavior is shared by other languages.
 227 enum LanguageSpecificCasingBehavior {
 228   eLSCB_None,    // default non-lang-specific behavior
 229   eLSCB_Dutch,   // treat "ij" digraph as a unit for capitalization
 230   eLSCB_Greek,   // strip accent when uppercasing Greek vowels
 231   eLSCB_Irish,   // keep prefix letters as lowercase when uppercasing Irish
 232   eLSCB_Turkish  // preserve dotted/dotless-i distinction in uppercase
 233 };
 234
 235 static LanguageSpecificCasingBehavior
 236 GetCasingFor(const nsIAtom* aLang)
 237 {
 238   if (!aLang) {
 239       return eLSCB_None;
 240   }
 241   if (aLang == nsGkAtoms::tr ||
 242       aLang == nsGkAtoms::az ||
 243       aLang == nsGkAtoms::ba ||
 244       aLang == nsGkAtoms::crh ||
 245       aLang == nsGkAtoms::tt) {
 246     return eLSCB_Turkish;
 247   }
 248   if (aLang == nsGkAtoms::nl) {
 249     return eLSCB_Dutch;
 250   }
 251   if (aLang == nsGkAtoms::el) {
 252     return eLSCB_Greek;
 253   }
 254   if (aLang == nsGkAtoms::ga) {
 255     return eLSCB_Irish;
 256   }
 257
 258   // Is there a region subtag we should ignore?
 259   nsAtomString langStr(const_cast<nsIAtom*>(aLang));
 260   int index = langStr.FindChar('-');
 261   if (index > 0) {
 262     langStr.Truncate(index);
 263     nsCOMPtr<nsIAtom> truncatedLang = do_GetAtom(langStr);
 264     return GetCasingFor(truncatedLang);
 265   }
 266
 267   return eLSCB_None;
 268 }
 269
 270 bool
 271 nsCaseTransformTextRunFactory::TransformString(
 272     const nsAString& aString,
 273     nsString& aConvertedString,
 274     bool aAllUppercase,
 275     const nsIAtom* aLanguage,
 276     nsTArray<bool>& aCharsToMergeArray,
 277     nsTArray<bool>& aDeletedCharsArray,
 278     nsTransformedTextRun* aTextRun,
 279     nsTArray<uint8_t>* aCanBreakBeforeArray,
 280     nsTArray<nsStyleContext*>* aStyleArray)
 281 {
 282   NS_PRECONDITION(!aTextRun || (aCanBreakBeforeArray && aStyleArray),
 283                   "either none or all three optional parameters required");
 284
 285   uint32_t length = aString.Length();
 286   const char16_t* str = aString.BeginReading();
 287
 288   bool mergeNeeded = false;
 289
 290   bool capitalizeDutchIJ = false;
 291   bool prevIsLetter = false;
 292   bool ntPrefix = false; // true immediately after a word-initial 'n' or 't'
 293                          // when doing Irish lowercasing
 294   uint32_t sigmaIndex = uint32_t(-1);
 295   nsIUGenCategory::nsUGenCategory cat;
 296
 297   uint8_t style = aAllUppercase ? NS_STYLE_TEXT_TRANSFORM_UPPERCASE : 0;
 298   const nsIAtom* lang = aLanguage;
 299
 300   LanguageSpecificCasingBehavior languageSpecificCasing = GetCasingFor(lang);
 301   mozilla::GreekCasing::State greekState;
 302   mozilla::IrishCasing::State irishState;
 303   uint32_t irishMark = uint32_t(-1); // location of possible prefix letter(s)
 304
 305   for (uint32_t i = 0; i < length; ++i) {
 306     uint32_t ch = str[i];
 307
 308     nsStyleContext* styleContext;
 309     if (aTextRun) {
 310       styleContext = aTextRun->mStyles[i];
 311       style = aAllUppercase ? NS_STYLE_TEXT_TRANSFORM_UPPERCASE :
 312         styleContext->StyleText()->mTextTransform;
 313
 314       if (lang != styleContext->StyleFont()->mLanguage) {
 315         lang = styleContext->StyleFont()->mLanguage;
 316         languageSpecificCasing = GetCasingFor(lang);
 317         greekState.Reset();
 318         irishState.Reset();
 319         irishMark = uint32_t(-1);
 320       }
 321     }
 322
 323     int extraChars = 0;
 324     const mozilla::unicode::MultiCharMapping *mcm;
 325     bool inhibitBreakBefore = false; // have we just deleted preceding hyphen?
 326
 327     if (NS_IS_HIGH_SURROGATE(ch) && i < length - 1 &&
 328         NS_IS_LOW_SURROGATE(str[i + 1])) {
 329       ch = SURROGATE_TO_UCS4(ch, str[i + 1]);
 330     }
 331
 332     switch (style) {
 333     case NS_STYLE_TEXT_TRANSFORM_LOWERCASE:
 334       if (languageSpecificCasing == eLSCB_Turkish) {
 335         if (ch == 'I') {
 336           ch = LATIN_SMALL_LETTER_DOTLESS_I;
 337           prevIsLetter = true;
 338           sigmaIndex = uint32_t(-1);
 339           break;
 340         }
 341         if (ch == LATIN_CAPITAL_LETTER_I_WITH_DOT_ABOVE) {
 342           ch = 'i';
 343           prevIsLetter = true;
 344           sigmaIndex = uint32_t(-1);
 345           break;
 346         }
 347       }
 348
 349       cat = mozilla::unicode::GetGenCategory(ch);
 350
 351       if (languageSpecificCasing == eLSCB_Irish &&
 352           cat == nsIUGenCategory::kLetter) {
 353         // See bug 1018805 for Irish lowercasing requirements
 354         if (!prevIsLetter && (ch == 'n' || ch == 't')) {
 355           ntPrefix = true;
 356         } else {
 357           if (ntPrefix && mozilla::IrishCasing::IsUpperVowel(ch)) {
 358             aConvertedString.Append('-');
 359             ++extraChars;
 360           }
 361           ntPrefix = false;
 362         }
 363       } else {
 364         ntPrefix = false;
 365       }
 366
 367       // Special lowercasing behavior for Greek Sigma: note that this is listed
 368       // as context-sensitive in Unicode's SpecialCasing.txt, but is *not* a
 369       // language-specific mapping; it applies regardless of the language of
 370       // the element.
 371       //
 372       // The lowercase mapping for CAPITAL SIGMA should be to SMALL SIGMA (i.e.
 373       // the non-final form) whenever there is a following letter, or when the
 374       // CAPITAL SIGMA occurs in isolation (neither preceded nor followed by a
 375       // LETTER); and to FINAL SIGMA when it is preceded by another letter but
 376       // not followed by one.
 377       //
 378       // To implement the context-sensitive nature of this mapping, we keep
 379       // track of whether the previous character was a letter. If not, CAPITAL
 380       // SIGMA will map directly to SMALL SIGMA. If the previous character
 381       // was a letter, CAPITAL SIGMA maps to FINAL SIGMA and we record the
 382       // position in the converted string; if we then encounter another letter,
 383       // that FINAL SIGMA is replaced with a standard SMALL SIGMA.
 384
 385       // If sigmaIndex is not -1, it marks where we have provisionally mapped
 386       // a CAPITAL SIGMA to FINAL SIGMA; if we now find another letter, we
 387       // need to change it to SMALL SIGMA.
 388       if (sigmaIndex != uint32_t(-1)) {
 389         if (cat == nsIUGenCategory::kLetter) {
 390           aConvertedString.SetCharAt(GREEK_SMALL_LETTER_SIGMA, sigmaIndex);
 391         }
 392       }
 393
 394       if (ch == GREEK_CAPITAL_LETTER_SIGMA) {
 395         // If preceding char was a letter, map to FINAL instead of SMALL,
 396         // and note where it occurred by setting sigmaIndex; we'll change it
 397         // to standard SMALL SIGMA later if another letter follows
 398         if (prevIsLetter) {
 399           ch = GREEK_SMALL_LETTER_FINAL_SIGMA;
 400           sigmaIndex = aConvertedString.Length();
 401         } else {
 402           // CAPITAL SIGMA not preceded by a letter is unconditionally mapped
 403           // to SMALL SIGMA
 404           ch = GREEK_SMALL_LETTER_SIGMA;
 405           sigmaIndex = uint32_t(-1);
 406         }
 407         prevIsLetter = true;
 408         break;
 409       }
 410
 411       // ignore diacritics for the purpose of contextual sigma mapping;
 412       // otherwise, reset prevIsLetter appropriately and clear the
 413       // sigmaIndex marker
 414       if (cat != nsIUGenCategory::kMark) {
 415         prevIsLetter = (cat == nsIUGenCategory::kLetter);
 416         sigmaIndex = uint32_t(-1);
 417       }
 418
 419       mcm = mozilla::unicode::SpecialLower(ch);
 420       if (mcm) {
 421         int j = 0;
 422         while (j < 2 && mcm->mMappedChars[j + 1]) {
 423           aConvertedString.Append(mcm->mMappedChars[j]);
 424           ++extraChars;
 425           ++j;
 426         }
 427         ch = mcm->mMappedChars[j];
 428         break;
 429       }
 430
 431       ch = ToLowerCase(ch);
 432       break;
 433
 434     case NS_STYLE_TEXT_TRANSFORM_UPPERCASE:
 435       if (languageSpecificCasing == eLSCB_Turkish && ch == 'i') {
 436         ch = LATIN_CAPITAL_LETTER_I_WITH_DOT_ABOVE;
 437         break;
 438       }
 439
 440       if (languageSpecificCasing == eLSCB_Greek) {
 441         ch = mozilla::GreekCasing::UpperCase(ch, greekState);
 442         break;
 443       }
 444
 445       if (languageSpecificCasing == eLSCB_Irish) {
 446         bool mark;
 447         uint8_t action;
 448         ch = mozilla::IrishCasing::UpperCase(ch, irishState, mark, action);
 449         if (mark) {
 450           irishMark = aConvertedString.Length();
 451           break;
 452         } else if (action) {
 453           nsString& str = aConvertedString; // shorthand
 454           switch (action) {
 455           case 1:
 456             // lowercase a single prefix letter
 457             NS_ASSERTION(str.Length() > 0 && irishMark < str.Length(),
 458                          "bad irishMark!");
 459             str.SetCharAt(ToLowerCase(str[irishMark]), irishMark);
 460             irishMark = uint32_t(-1);
 461             break;
 462           case 2:
 463             // lowercase two prefix letters (immediately before current pos)
 464             NS_ASSERTION(str.Length() >= 2 && irishMark == str.Length() - 2,
 465                          "bad irishMark!");
 466             str.SetCharAt(ToLowerCase(str[irishMark]), irishMark);
 467             str.SetCharAt(ToLowerCase(str[irishMark + 1]), irishMark + 1);
 468             irishMark = uint32_t(-1);
 469             break;
 470           case 3:
 471             // lowercase one prefix letter, and delete following hyphen
 472             // (which must be the immediately-preceding char)
 473             NS_ASSERTION(str.Length() >= 2 && irishMark == str.Length() - 2,
 474                          "bad irishMark!");
 475             str.Replace(irishMark, 2, ToLowerCase(str[irishMark]));
 476             aDeletedCharsArray[irishMark + 1] = true;
 477             // Remove the trailing entries (corresponding to the deleted hyphen)
 478             // from the auxiliary arrays.
 479             aCharsToMergeArray.SetLength(aCharsToMergeArray.Length() - 1);
 480             if (aTextRun) {
 481               aStyleArray->SetLength(aStyleArray->Length() - 1);
 482               aCanBreakBeforeArray->SetLength(aCanBreakBeforeArray->Length() - 1);
 483               inhibitBreakBefore = true;
 484             }
 485             mergeNeeded = true;
 486             irishMark = uint32_t(-1);
 487             break;
 488           }
 489           // ch has been set to the uppercase for current char;
 490           // No need to check for SpecialUpper here as none of the characters
 491           // that could trigger an Irish casing action have special mappings.
 492           break;
 493         }
 494         // If we didn't have any special action to perform, fall through
 495         // to check for special uppercase (ß)
 496       }
 497
 498       mcm = mozilla::unicode::SpecialUpper(ch);
 499       if (mcm) {
 500         int j = 0;
 501         while (j < 2 && mcm->mMappedChars[j + 1]) {
 502           aConvertedString.Append(mcm->mMappedChars[j]);
 503           ++extraChars;
 504           ++j;
 505         }
 506         ch = mcm->mMappedChars[j];
 507         break;
 508       }
 509
 510       ch = ToUpperCase(ch);
 511       break;
 512
 513     case NS_STYLE_TEXT_TRANSFORM_CAPITALIZE:
 514       if (aTextRun) {
 515         if (capitalizeDutchIJ && ch == 'j') {
 516           ch = 'J';
 517           capitalizeDutchIJ = false;
 518           break;
 519         }
 520         capitalizeDutchIJ = false;
 521         if (i < aTextRun->mCapitalize.Length() && aTextRun->mCapitalize[i]) {
 522           if (languageSpecificCasing == eLSCB_Turkish && ch == 'i') {
 523             ch = LATIN_CAPITAL_LETTER_I_WITH_DOT_ABOVE;
 524             break;
 525           }
 526           if (languageSpecificCasing == eLSCB_Dutch && ch == 'i') {
 527             ch = 'I';
 528             capitalizeDutchIJ = true;
 529             break;
 530           }
 531
 532           mcm = mozilla::unicode::SpecialTitle(ch);
 533           if (mcm) {
 534             int j = 0;
 535             while (j < 2 && mcm->mMappedChars[j + 1]) {
 536               aConvertedString.Append(mcm->mMappedChars[j]);
 537               ++extraChars;
 538               ++j;
 539             }
 540             ch = mcm->mMappedChars[j];
 541             break;
 542           }
 543
 544           ch = ToTitleCase(ch);
 545         }
 546       }
 547       break;
 548
 549     case NS_STYLE_TEXT_TRANSFORM_FULLWIDTH:
 550       ch = mozilla::unicode::GetFullWidth(ch);
 551       break;
 552
 553     default:
 554       break;
 555     }
 556
 557     if (ch == uint32_t(-1)) {
 558       aDeletedCharsArray.AppendElement(true);
 559       mergeNeeded = true;
 560     } else {
 561       aDeletedCharsArray.AppendElement(false);
 562       aCharsToMergeArray.AppendElement(false);
 563       if (aTextRun) {
 564         aStyleArray->AppendElement(styleContext);
 565         aCanBreakBeforeArray->AppendElement(inhibitBreakBefore ? false :
 566                                             aTextRun->CanBreakLineBefore(i));
 567       }
 568
 569       if (IS_IN_BMP(ch)) {
 570         aConvertedString.Append(ch);
 571       } else {
 572         aConvertedString.Append(H_SURROGATE(ch));
 573         aConvertedString.Append(L_SURROGATE(ch));
 574         ++i;
 575         aDeletedCharsArray.AppendElement(true); // not exactly deleted, but the
 576                                                 // trailing surrogate is skipped
 577         ++extraChars;
 578       }
 579
 580       while (extraChars-- > 0) {
 581         mergeNeeded = true;
 582         aCharsToMergeArray.AppendElement(true);
 583         if (aTextRun) {
 584           aStyleArray->AppendElement(styleContext);
 585           aCanBreakBeforeArray->AppendElement(false);
 586         }
 587       }
 588     }
 589   }
 590
 591   return mergeNeeded;
 592 }
 593
 594 void
 595 nsCaseTransformTextRunFactory::RebuildTextRun(nsTransformedTextRun* aTextRun,
 596     gfxContext* aRefContext)
 597 {
 598   nsAutoString convertedString;
 599   nsAutoTArray<bool,50> charsToMergeArray;
 600   nsAutoTArray<bool,50> deletedCharsArray;
 601   nsAutoTArray<uint8_t,50> canBreakBeforeArray;
 602   nsAutoTArray<nsStyleContext*,50> styleArray;
 603
 604   bool mergeNeeded = TransformString(aTextRun->mString,
 605                                      convertedString,
 606                                      mAllUppercase,
 607                                      nullptr,
 608                                      charsToMergeArray,
 609                                      deletedCharsArray,
 610                                      aTextRun,
 611                                      &canBreakBeforeArray,
 612                                      &styleArray);
 613
 614   uint32_t flags;
 615   gfxTextRunFactory::Parameters innerParams =
 616       GetParametersForInner(aTextRun, &flags, aRefContext);
 617   gfxFontGroup* fontGroup = aTextRun->GetFontGroup();
 618
 619   nsAutoPtr<nsTransformedTextRun> transformedChild;
 620   nsAutoPtr<gfxTextRun> cachedChild;
 621   gfxTextRun* child;
 622
 623   if (mInnerTransformingTextRunFactory) {
 624     transformedChild = mInnerTransformingTextRunFactory->MakeTextRun(
 625         convertedString.BeginReading(), convertedString.Length(),
 626         &innerParams, fontGroup, flags, styleArray.Elements(), false);
 627     child = transformedChild.get();
 628   } else {
 629     cachedChild = fontGroup->MakeTextRun(
 630         convertedString.BeginReading(), convertedString.Length(),
 631         &innerParams, flags);
 632     child = cachedChild.get();
 633   }
 634   if (!child)
 635     return;
 636   // Copy potential linebreaks into child so they're preserved
 637   // (and also child will be shaped appropriately)
 638   NS_ASSERTION(convertedString.Length() == canBreakBeforeArray.Length(),
 639                "Dropped characters or break-before values somewhere!");
 640   child->SetPotentialLineBreaks(0, canBreakBeforeArray.Length(),
 641       canBreakBeforeArray.Elements(), aRefContext);
 642   if (transformedChild) {
 643     transformedChild->FinishSettingProperties(aRefContext);
 644   }
 645
 646   if (mergeNeeded) {
 647     // Now merge multiple characters into one multi-glyph character as required
 648     // and deal with skipping deleted accent chars
 649     NS_ASSERTION(charsToMergeArray.Length() == child->GetLength(),
 650                  "source length mismatch");
 651     NS_ASSERTION(deletedCharsArray.Length() == aTextRun->GetLength(),
 652                  "destination length mismatch");
 653     MergeCharactersInTextRun(aTextRun, child, charsToMergeArray.Elements(),
 654                              deletedCharsArray.Elements());
 655   } else {
 656     // No merging to do, so just copy; this produces a more optimized textrun.
 657     // We can't steal the data because the child may be cached and stealing
 658     // the data would break the cache.
 659     aTextRun->ResetGlyphRuns();
 660     aTextRun->CopyGlyphDataFrom(child, 0, child->GetLength(), 0);
 661   }
 662 }