/*
 *  Uniscribe interface (& related classes) class implementation
 *
 *  File:    uspi.cpp
 *  Create:  Jan 10, 1998
 *  Author:  Worachai Chaoweeraprasit (wchao)
 *
 *  Copyright (c) 1998-2000, Microsoft Corporation. All rights reserved.
 */

#include "_common.h"

#ifndef NOCOMPLEXSCRIPTS

#include "_font.h"
#include "_edit.h"
#include "_frunptr.h"
#include "_select.h"
#include "_measure.h"
#include "_uspi.h"

CUniscribe*     g_pusp = NULL;
int             g_cMaxScript = 0x100;

// initial dummy script properties (= SCRIPT_UNDEFINED)
static const SCRIPT_PROPERTIES  g_propUndef     = { LANG_NEUTRAL, FALSE, FALSE, FALSE, FALSE, 0 };
static const SCRIPT_PROPERTIES* g_pPropUndef[1] = { &g_propUndef };

// Constructor: caches the digit substitution script and asks Uniscribe
// how many scripts it knows about (stored in g_cMaxScript).
CUniscribe::CUniscribe ()
{
    // Initialize digit substitution info
    ApplyDigitSubstitution(W32->GetDigitSubstitutionMode());

    // Get maximum number of scripts supported
    ScriptGetProperties(NULL, &g_cMaxScript);
}

// Test the OS if it does any complex script.
// The probe converts one single-byte character through each of three code
// pages and checks that the expected Unicode character comes back; one
// successful round trip is enough.
// REVIEW (keithcu) What if it only supports indic, but not the other ones?
BOOL IsSupportedOS()
{
    // Win95 FE is never considered complex-script capable.
    if (OnWin95FE())
        return FALSE;

    // Parallel tables: code page, probe byte, expected Unicode character.
    int     rguCodePage[]   = {1255, 1256, 874};
    BYTE    rgbch[]         = {0xe0, 0xd3, 0xa1};
    WCHAR   rgwch[]         = {0x05d0, 0x0633, 0x0e01};

    for (int iProbe = 0; iProbe < 3; iProbe++)
    {
        WCHAR wch;

        if (MBTWC(rguCodePage[iProbe], 0, (LPCSTR)&rgbch[iProbe], 1, (LPWSTR)&wch, 1, NULL) > 0 &&
            wch == rgwch[iProbe])
        {
            return TRUE;        // support either Arabic, Hebrew or Thai
        }
    }
    return FALSE;
}

// Prepare information for digit substitution
// return: Native digit script (shaping engine) ID.
// WORD CUniscribe::ApplyDigitSubstitution(BYTE bDigitSubstMode) { _wesNationalDigit = 0; // Remember national digits script ID if substitution mode is not None if (bDigitSubstMode != DIGITS_NOTIMPL && bDigitSubstMode != DIGITS_NONE) { WCHAR chZero = 0x0030; int cItems; SCRIPT_ITEM si[2]; SCRIPT_CONTROL sc = {0}; SCRIPT_STATE ss = {0}; // force national digit mode sc.uDefaultLanguage = GetNationalDigitLanguage(GetThreadLocale()); ss.fDigitSubstitute = TRUE; sc.fContextDigits = FALSE; if (SUCCEEDED(ScriptItemize(&chZero, 1, 2, &sc, &ss, (SCRIPT_ITEM*)&si, (int*)&cItems))) _wesNationalDigit = si[0].a.eScript; } return _wesNationalDigit; } // Some locales may have its own traditional (native) digit and national standard digit // recognised by a standard body and adopted by NLSAPI. The example is that Nepali(India) // has its own digit but the India standard uses Hindi digit as the national digit. // DWORD CUniscribe::GetNationalDigitLanguage(LCID lcid) { DWORD dwDigitLang = PRIMARYLANGID(LANGIDFROMLCID(lcid)); if (W32->OnWinNT5()) { WCHAR rgwstrDigit[20]; if (GetLocaleInfoW(lcid, LOCALE_SNATIVEDIGITS, rgwstrDigit, ARRAY_SIZE(rgwstrDigit))) { // Steal this from Uniscribe (build 0231) switch (rgwstrDigit[1]) { case 0x0661: dwDigitLang = LANG_ARABIC; break; case 0x06F1: dwDigitLang = LANG_FARSI; break; case 0x0e51: dwDigitLang = LANG_THAI; break; case 0x0967: dwDigitLang = LANG_HINDI; break; case 0x09e7: dwDigitLang = LANG_BENGALI; break; case 0x0a67: dwDigitLang = LANG_PUNJABI; break; case 0x0ae7: dwDigitLang = LANG_GUJARATI; break; case 0x0b67: dwDigitLang = LANG_ORIYA; break; case 0x0be7: dwDigitLang = LANG_TAMIL; break; case 0x0c67: dwDigitLang = LANG_TELUGU; break; case 0x0ce7: dwDigitLang = LANG_KANNADA; break; case 0x0d67: dwDigitLang = LANG_MALAYALAM; break; case 0x0f21: dwDigitLang = LANG_TIBETAN; break; case 0x0ed1: dwDigitLang = LANG_LAO; break; } } } return dwDigitLang; } CUniscribe::~CUniscribe () { if (_pFSM) { delete _pFSM; } } /***** High level services 
*****/

// Tokenize string and run Unicode Bidi algorithm if requested.
//
// On success the item count is stored in *pcItems and also returned.
// On failure *pcItems is left untouched.
//
// return : 0  - error (ScriptItemize failed)
//          >0 - number of items generated
//
int CUniscribe::ItemizeString (
    USP_CLIENT* pc,                 // in: Working structure
    WORD        uInitLevel,         // in: Initial Bidi level
    int*        pcItems,            // out: Count of items generated
    WCHAR*      pwchString,         // in: Input string
    int         cch,                // in: Number of character to itemize
    BOOL        fUnicodeBiDi,       // in: TRUE - Use UnicodeBidi
    WORD        wLangId)            // in: (optional) Dominant language preference
{
    Assert (pc && pc->si && pcItems && pwchString && cch > 0 && cch <= pc->si->cchString);

    USP_CLIENT_SI*  pc_si = pc->si;
    SCRIPT_ITEM*    psi = pc_si->psi;
    SCRIPT_CONTROL  sc = {0};
    SCRIPT_STATE    ss = {0};
    SCRIPT_CONTROL* psc;
    SCRIPT_STATE*   pss;
    HRESULT         hr;
    int             cItems = 0;

    if (fUnicodeBiDi)
    {
        // Fix: the source read "psc = <U+227B>", an "&sc;" sequence that had been
        // decoded as an HTML entity. The intent is the address of the local
        // SCRIPT_CONTROL.
        psc = &sc;
        pss = &ss;

        if (wLangId == LANG_NEUTRAL)
            wLangId = PRIMARYLANGID(LANGIDFROMLCID(GetThreadLocale()));

        // (preitemize:) set up initial state
        psc->uDefaultLanguage = wLangId;

        // Classify + - and / in Win9x legacy manner
        psc->fLegacyBidiClass = TRUE;

        // For Arabic Office's compatibility.
        // We enable fArabicNumContext if the dominant language is Arabic.
        //
        if (psc->uDefaultLanguage == LANG_ARABIC)
            pss->fArabicNumContext = uInitLevel & 1;

        pss->uBidiLevel = uInitLevel;

        // Leave digit substitution to None since we do it ourself.
        // pss->fDigitSubstitute = FALSE;
        // psc->fContextDigits = FALSE;
    }
    else
    {
        // No control/state: ScriptItemize is called without the Bidi setup above
        psc = NULL;
        pss = NULL;
    }

    // begin real work
    // cch+1 is passed as the maximum item count for the psi buffer.
    hr = ScriptItemize(pwchString, cch, cch+1, psc, pss, psi, (int*)&cItems);

    if (!SUCCEEDED(hr))
        return 0;

    *pcItems = cItems;
    return cItems;
}


// Produce a shaped string (glyph array), taking care of font association and measurer's CF update
//
// Success can require 3 calls to Shape():
// 1. Returns E_PENDING (script cache doesn't contain the glyphing information)
// 2. Return USP_E_SCRIPT_NOT_IN_FONT --the HFONT doesn't contain the script needed to do the glyphing
// 3. Hopefully success, but may return again if the fallback font doesn't exist, but we quit anyway.
int CUniscribe::ShapeString ( PLSRUN plsrun, // in: The first run to be shaped SCRIPT_ANALYSIS* psa, // in: Analysis of the run to be shaped CMeasurer* pme, // in: Measurer points to start cp of the run const WCHAR* pwch, // in: String to be shaped int cch, // in: Count of chars WORD*& pwgi, // out: Reference to glyph indices array WORD* pwlc, // out: Logical cluster array SCRIPT_VISATTR*& psva) // out: Reference to glyph's attribute array { AssertSz (plsrun && psa && pme && pwch, "ShapeString failed: Invalid params"); HRESULT hr = S_OK; HRESULT hrLastError = S_OK; HDC hdc = NULL; HFONT hOrgFont = NULL; int cGlyphs; int cchAdd = 0; CCcs *pccsSave = pme->Check_pccs(); int nAttempt = 8; // Maximum attempt to realloc glyph buffer to shape a string // make sure that we have proper font cache ready to use if (!pme->_pccs) return 0; if (psa->fNoGlyphIndex) // If no glyph processing, hdc must be around. hdc = PrepareShapeDC(plsrun, pme, E_PENDING, hOrgFont); // prepare glyph buffer if (!CacheAllocGlyphBuffers(cch, cGlyphs, pwgi, psva)) return 0; do { hr = ScriptShape(hdc, &pme->_pccs->_sc, pwch, cch, cGlyphs, psa, pwgi, pwlc, psva, &cGlyphs); if (SUCCEEDED(hr)) break; // Error handling... switch (hr) { case E_PENDING: case USP_E_SCRIPT_NOT_IN_FONT: if (hr == hrLastError) nAttempt = 0; // We encounter the same error twice. else { hdc = PrepareShapeDC(plsrun, pme, hr, hOrgFont); hrLastError = hr; } break; case E_OUTOFMEMORY: // (#6773)Indic shaping engine could produce glyphs more than we could hold. // cchAdd += 16; if (CacheAllocGlyphBuffers(cch + cchAdd, cGlyphs, pwgi, psva)) { nAttempt--; break; } default: nAttempt = 0; //AssertSz(FALSE, "Shaping fails with invalid error or we run out of memory."); break; } } while (nAttempt > 0); // restore hdc's original font if (hdc && hOrgFont) SelectObject(hdc, hOrgFont); if (pme->_pccs != pccsSave) plsrun->SetFallback(SUCCEEDED(hr)); return SUCCEEDED(hr) ? 
cGlyphs : 0; } // Place a string and take care of font association and measurer's CF update // // This is called right after ShapeString. int CUniscribe::PlaceString( PLSRUN plsrun, // in: The first run to be shaped SCRIPT_ANALYSIS* psa, // in: Analysis of the run to be shaped CMeasurer* pme, // in: Measurer points to start cp of the run const WORD* pcwgi, // in: Glyph indices array int cgi, // in: Count of input glyphs const SCRIPT_VISATTR* psva, // in: Glyph's attribute array int* pgdx, // out: Glyph's advanced width array GOFFSET* pgduv, // out: Glyph's offset array ABC* pABC) // out: Run's dimension { AssertSz (plsrun && psa && pme && pcwgi, "PlaceString failed: Invalid params"); HRESULT hr = S_OK; HRESULT hrLastError = S_OK; HDC hdc = NULL; HFONT hOrgFont = NULL; int nAttempt = 1; pme->Check_pccs(); pme->ApplyFontCache(plsrun->IsFallback(), plsrun->_a.eScript); // make sure that we have proper font cache ready to use if (!pme->_pccs) return 0; if (psa->fNoGlyphIndex) // If no glyph processing, hdc must be around. hdc = PrepareShapeDC(plsrun, pme, E_PENDING, hOrgFont); do { hr = ScriptPlace(hdc, &pme->_pccs->_sc, pcwgi, cgi, psva, psa, pgdx, pgduv, pABC); if (SUCCEEDED(hr)) break; // Error handling... switch (hr) { case E_PENDING: if (hr == hrLastError) nAttempt = 0; // We encounter the same error twice. else { hdc = PrepareShapeDC(plsrun, pme, hr, hOrgFont); hrLastError = hr; } break; default: nAttempt = 0; //AssertSz(FALSE, "Placing fails with invalid error."); break; } } while (nAttempt > 0); // restore hdc's original font if (hdc && hOrgFont) SelectObject(hdc, hOrgFont); return SUCCEEDED(hr) ? cgi : 0; } // Placing given string results in logical width array, // the result array would be used to record WMF metafile. 
// int CUniscribe::PlaceMetafileString ( PLSRUN plsrun, // in: The first run to be shaped CMeasurer* pme, // in: Measurer points to start cp of the run const WCHAR* pwch, // in: Input codepoint string int cch, // in: Character count PINT* ppiDx) // out: Pointer to logical widths array { AssertSz (pme && pwch && ppiDx, "PlaceMetafileString failed: Invalid params"); if (W32->OnWinNT4() || W32->OnWin9xThai()) { // MET NT40 has bug in lpdx justification so i doesnt playback the lpdx very nicely. // Thai Win9x simply cannot handle fancy lpdx values generated by Uniscribe. // We workaround both cases here by metafiling no lpdx and let the system reconstructs // it from scratch during playback time. // =FUTURE= If we do line justification. We need more sophisticated work here // basically to reconstruct the OS preferred type of lpdx. // *ppiDx = NULL; return cch; } HRESULT hr = E_FAIL; PUSP_CLIENT pc = NULL; int* piLogDx; // logical width array int* piVisDx; // visual width array GOFFSET* pGoffset; // glyph offset array WORD* pwgi; // glyph array SCRIPT_VISATTR* psva; // glyph properties array int cgi = 0; BYTE pbBufIn[MAX_CLIENT_BUF]; SCRIPT_ANALYSIS sa = plsrun->_a; BOOL fVisualGlyphDx = sa.fRTL && W32->OnWin9x() && W32->OnBiDiOS(); CreateClientStruc(pbBufIn, MAX_CLIENT_BUF, &pc, cch, cli_pcluster); if (!pc) return 0; PUSP_CLIENT_SSP pcssp = pc->ssp; if (fVisualGlyphDx) sa.fLogicalOrder = FALSE; // shaping result in visual order // Shape string if (cgi = ShapeString(plsrun, &sa, pme, pwch, (int)cch, pwgi, pcssp->pcluster, psva)) { // Get static buffer for logical and visual width arrays // if ( (piLogDx = GetWidthBuffer(cgi + cch)) && (pGoffset = GetGoffsetBuffer(cgi)) ) { piVisDx = &piLogDx[cch]; // then place it... 
if (cgi == PlaceString(plsrun, &sa, pme, pwgi, cgi, psva, piVisDx, pGoffset, NULL)) { if (fVisualGlyphDx) { // Workaround BiDi Win9x's lpdx handling // It assumes ExtTextOut's dx array is glyph width in visual order Assert (cgi <= cch); // glyph count never exceeds character count in BiDi CopyMemory (piLogDx, piVisDx, min(cgi, cch)*sizeof(int)); } else { // Map visual glyph widths to logical widths hr = ScriptGetLogicalWidths(&sa, cch, cgi, piVisDx, pcssp->pcluster, psva, piLogDx); } } // result *ppiDx = piLogDx; } } if (pc && pbBufIn != (BYTE*)pc) FreePv(pc); return SUCCEEDED(hr) ? cgi : 0; } /***** Helper functions *****/ // Retrieve the BidiLevel FSM const CBiDiFSM* CUniscribe::GetFSM () { if (!_pFSM) { _pFSM = new CBiDiFSM(this); if (_pFSM && !_pFSM->Init()) { delete _pFSM; } } return _pFSM; } // Prepare the shapeable font ready to dc for a given script // // USP_E_SCRIPT_NOT_IN_FONT - complex scripts font association // E_PENDING - prepare dc with current font selected // HDC CUniscribe::PrepareShapeDC ( PLSRUN plsrun, // in: The first run to be shaped CMeasurer* pme, // in: Measurer points to start cp of the run HRESULT hrReq, // in: Error code to react HFONT& hOrgFont) // in/out: Original font of the shape DC { Assert (pme); HDC hdc = NULL; HFONT hOldFont; switch (hrReq) { case USP_E_SCRIPT_NOT_IN_FONT: { pme->ApplyFontCache(fTrue, plsrun->_a.eScript); #ifdef DEBUG if (pme->_pccs) Tracef(TRCSEVWARN, "USP_E_SCRIPT_NOT_IN_FONT: charset %d applied", pme->_pccs->_bCharSet); #endif } default: if (pme->_pccs) { hdc = pme->_pccs->_hdc; hOldFont = (HFONT)SelectObject(hdc, pme->_pccs->_hfont); if (!hOrgFont) hOrgFont = hOldFont; } } return hdc; } const SCRIPT_PROPERTIES* CUniscribe::GeteProp (WORD eScript) { if (!_ppProp) { if (!SUCCEEDED(ScriptGetProperties(&_ppProp, NULL)) || !_ppProp) _ppProp = g_pPropUndef; } if (_ppProp == g_pPropUndef || eScript >= (WORD)g_cMaxScript) eScript = 0; return _ppProp[eScript]; } // Figure proper charset to use for complex script. 
// The resulted charset can be either actual or virtual (internal) GDI charset used by given script BOOL CUniscribe::GetComplexCharRep( const SCRIPT_PROPERTIES* psp, // Uniscribe script's properties BYTE iCharRepDefault, // -1 format's charset BYTE& iCharRepOut) // out: Charset to use { Assert(psp); BYTE iCharRep = !psp->fCDM ? CharRepFromCharSet(psp->bCharSet) : GetCDMCharRep(iCharRepDefault); BOOL fr = psp->fComplex && !psp->fControl; if (fr) { if (iCharRep == ANSI_INDEX || iCharRep == DEFAULT_INDEX) iCharRep = CharRepFromLID(psp->langid); if (IsBiDiCharRep(iCharRep)) _iCharRepRtl = iCharRep; // Cache the last found BiDi charset iCharRepOut = iCharRep; } return fr; } // Figure out the charset to use for CDM run // BYTE CUniscribe::GetCDMCharRep( BYTE iCharRepDefault) { if (!_iCharRepCDM) { _iCharRepCDM = (iCharRepDefault == VIET_INDEX || W32->GetPreferredKbd(VIET_INDEX) || GetLocaleCharRep() == VIET_INDEX || GetACP() == 1258) ? VIET_INDEX : DEFAULT_INDEX; } return _iCharRepCDM; } BYTE CUniscribe::GetRtlCharRep( CTxtEdit* ped, CRchTxtPtr* prtp) // ptr to the numeric run { CFormatRunPtr rp(prtp->_rpCF); rp.AdjustBackward(); BYTE iCharRep = ped->GetCharFormat(rp.GetFormat())->_iCharRep; if (!IsBiDiCharRep(iCharRep)) { iCharRep = _iCharRepRtl; // Use the last found BiDi charset if (!IsBiDiCharRep(iCharRep)) { // try default charset DWORD dwCharFlags; iCharRep = ped->GetCharFormat(-1)->_iCharRep; if (!IsBiDiCharRep(iCharRep)) { // Then the system charset iCharRep = CharRepFromCodePage(GetACP()); if (!IsBiDiCharRep(iCharRep)) { // Then the content dwCharFlags = ped->GetCharFlags() & (FARABIC | FHEBREW); if (dwCharFlags == FARABIC) iCharRep = ARABIC_INDEX; else if(dwCharFlags == FHEBREW) iCharRep = HEBREW_INDEX; else { // And last chance with the first found loaded BiDi kbd if (W32->GetPreferredKbd(HEBREW_INDEX)) iCharRep = HEBREW_INDEX; else // Even if we can't find Arabic, we have to assume it here. 
iCharRep = ARABIC_INDEX; } } } } } Assert(IsBiDiCharRep(iCharRep)); return iCharRep; } // Substitute digit shaper in plsrun if needed // void CUniscribe::SubstituteDigitShaper ( PLSRUN plsrun, CMeasurer* pme) { Assert(plsrun && pme); CTxtEdit* ped = pme->GetPed(); WORD wScript; if (GeteProp(plsrun->_a.eScript)->fNumeric) { wScript = plsrun->_pCF->_wScript; // reset it before switch (W32->GetDigitSubstitutionMode()) { case DIGITS_CTX: { if (ped->IsRich()) { // Context mode simply means the charset of the kbd for richtext. if (!IsBiDiCharRep(ped->GetCharFormat(pme->_rpCF.GetFormat())->_iCharRep)) break; } else { // Digit follows directionality of preceding run for plain text CFormatRunPtr rp(pme->_rpCF); Assert(rp.IsValid()); if (rp.PrevRun()) { if (!IsBiDiCharRep(ped->GetCharFormat(rp.GetFormat())->_iCharRep)) break; } else { // No preceding run, looking for the paragraph direction if (!pme->Get_pPF()->IsRtl()) break; } } // otherwise, fall thru... } case DIGITS_NATIONAL: wScript = _wesNationalDigit; default: break; } // Update all linked runs while (plsrun) { plsrun->_a.eScript = wScript; // assign proper shaping engine to digits plsrun = plsrun->_pNext; } } } /***** Uniscribe entry point *****/ // memory allocator // BOOL CUniscribe::CreateClientStruc ( BYTE* pbBufIn, LONG cbBufIn, PUSP_CLIENT* ppc, LONG cchString, DWORD dwMask) { Assert(ppc && pbBufIn); if (!ppc) return FALSE; *ppc = NULL; if (cchString == 0) cchString = 1; // simplify caller's logic LONG i; LONG cbSize; PBYTE pbBlock; // ScriptItemize's // PVOID pvString; PVOID pvsi; // ScriptBreak's // PVOID pvsla; // ScriptShape & Place's // PVOID pvwgi; PVOID pvsva; PVOID pvcluster; PVOID pvidx; PVOID pvgoffset; // subtable ptrs // PUSP_CLIENT_SI pc_si; PUSP_CLIENT_SB pc_sb; PUSP_CLIENT_SSP pc_ssp; #define RQ_COUNT 12 BUF_REQ brq[RQ_COUNT] = { // table and subtable blocks // { sizeof(USP_CLIENT), 1, (void**)ppc}, { sizeof(USP_CLIENT_SI), dwMask & cli_Itemize ? 
1 : 0, (void**)&pc_si}, { sizeof(USP_CLIENT_SB), dwMask & cli_Break ? 1 : 0, (void**)&pc_sb}, { sizeof(USP_CLIENT_SSP), dwMask & cli_ShapePlace ? 1 : 0, (void**)&pc_ssp}, // data blocks // { sizeof(WCHAR), dwMask & cli_string ? cchString + 1 : 0, &pvString}, { sizeof(SCRIPT_ITEM), dwMask & cli_psi ? cchString + 1 : 0, &pvsi}, { sizeof(SCRIPT_LOGATTR), dwMask & cli_psla ? cchString + 1 : 0, &pvsla}, { sizeof(WORD), dwMask & cli_pwgi ? GLYPH_COUNT(cchString+1) : 0, &pvwgi}, { sizeof(SCRIPT_VISATTR), dwMask & cli_psva ? GLYPH_COUNT(cchString+1) : 0, &pvsva}, { sizeof(WORD), dwMask & cli_pcluster ? cchString + 1 : 0, &pvcluster}, { sizeof(int), dwMask & cli_pidx ? GLYPH_COUNT(cchString+1) : 0, &pvidx}, { sizeof(GOFFSET), dwMask & cli_pgoffset ? GLYPH_COUNT(cchString+1) : 0, &pvgoffset}, }; // count total buffer size in byte (WORD aligned) // for (i=0, cbSize=0; i < RQ_COUNT; i++) { cbSize += ALIGN(brq[i].size * brq[i].c); } // allocate the whole buffer at once // if (cbSize > cbBufIn) { pbBlock = (PBYTE)PvAlloc(cbSize, 0); } else { pbBlock = pbBufIn; } if (!pbBlock) { // // memory management failed! 
// TRACEERRORSZ("Allocation failed in CreateClientStruc!\n"); *ppc = NULL; return FALSE; } // clear the main table ZeroMemory (pbBlock, sizeof(USP_CLIENT)); // assign ptrs in buffer request structure // for (i=0; i < RQ_COUNT; i++) { if (brq[i].c > 0) { *brq[i].ppv = pbBlock; pbBlock += ALIGN(brq[i].size * brq[i].c); } else { *brq[i].ppv = NULL; } } Assert(((PBYTE)(*ppc)+cbSize == pbBlock)); // fill in data block ptrs in subtable // if (pc_si) { pc_si->pwchString = (WCHAR*) pvString; pc_si->cchString = cchString; pc_si->psi = (SCRIPT_ITEM*) pvsi; } if (pc_sb) { pc_sb->psla = (SCRIPT_LOGATTR*) pvsla; } if (pc_ssp) { pc_ssp->pwgi = (WORD*) pvwgi; pc_ssp->psva = (SCRIPT_VISATTR*) pvsva; pc_ssp->pcluster = (WORD*) pvcluster; pc_ssp->pidx = (int*) pvidx; pc_ssp->pgoffset = (GOFFSET*) pvgoffset; } // fill in subtable ptrs in header table // (*ppc)->si = (PUSP_CLIENT_SI) pc_si; (*ppc)->sb = (PUSP_CLIENT_SB) pc_sb; (*ppc)->ssp = (PUSP_CLIENT_SSP) pc_ssp; return TRUE; } /////// CBidiFSM class implementation // // Create: Worachai Chaoweeraprasit(wchao), Jan 29, 1998 // CBiDiFSM::~CBiDiFSM () { FreePv(_pStart); } INPUT_CLASS CBiDiFSM::InputClass ( const CCharFormat* pCF, CTxtPtr* ptp, LONG cchRun) const { if (!_pusp->IsValid() || !pCF || pCF->_wScript == SCRIPT_WHITE) return chGround; const SCRIPT_PROPERTIES* psp = _pusp->GeteProp(pCF->_wScript); BYTE iCharRep = pCF->_iCharRep; if (psp->fControl) { if (cchRun == 1) switch (ptp->GetChar()) // single-char run { case LTRMARK: return chLTR; // \ltrmark case RTLMARK: return chRTL; // \rtlmark } return chGround; } if(IsSymbolOrOEMCharRep(iCharRep) || IsFECharRep(iCharRep) || pCF->_dwEffects & CFE_RUNISDBCS) return chLTR; BOOL fBiDiCharSet = IsBiDiCharSet(psp->bCharSet); if (psp->fNumeric) // Numeric digits return (fBiDiCharSet || IsBiDiCharRep(iCharRep)) ? digitRTL : digitLTR; // RTL if it's RTL script or its format charset is RTL and NOT a simplified script return (fBiDiCharSet || pCF->_wScript && IsBiDiCharRep(iCharRep)) ? 
chRTL : chLTR; } // The FSM generates run's embedding level based on given base level and puts it // in CFormatRun. LsFetchRun is the client using this result. // #ifdef DEBUG //#define DEBUG_LEVEL #endif #ifdef DEBUG_LEVEL void DebugLevel (CBiDiFSMCell* pCell) { Tracef(TRCSEVNONE, "%d,", pCell->_level._value); } #else #define DebugLevel(x) #endif HRESULT CBiDiFSM::RunFSM ( CRchTxtPtr* prtp, // in: text pointer to start run LONG cRuns, // in: number of FSM run LONG cRunsStart, // in: number of start run BYTE bBaseLevel) const // in: base level { Assert (prtp->_rpCF.IsValid() && cRuns > 0); CRchTxtPtr rtp(*prtp); const CCharFormat* pCF; LONG cchRun; LONG cRunsAll = cRuns + cRunsStart; CBiDiFSMCell* pCell; USHORT ucState = bBaseLevel ? S_X * NUM_FSM_INPUTS : 0; BOOL fNext = TRUE; // loop thru FSM for (; fNext && cRunsAll > 0; cRunsAll--, fNext = !!rtp.Move(cchRun)) { cchRun = rtp.GetCchLeftRunCF(); pCF = rtp.GetPed()->GetCharFormat(rtp._rpCF.GetFormat()); ucState += InputClass(pCF, &rtp._rpTX, cchRun); pCell = &_pStart[ucState]; // set level to FSM runs if (cRunsAll <= cRuns) rtp._rpCF.SetLevel (pCell->_level); DebugLevel(pCell); ucState = pCell->_uNext; // next state } return S_OK; } // Construct the BiDi embedding level FSM (FSM details see bidifsm2.html) // :FSM's size = NUM_FSM_INPUTS * NUM_FSM_STATES * sizeof(CBiDiFSMCell) = 6*5*4 = 120 bytes // BOOL CBiDiFSM::Init() { CBiDiFSMCell* pCell; int i; // Build the Bidi FSM _nState = NUM_FSM_STATES; _nInput = NUM_FSM_INPUTS; pCell = (CBiDiFSMCell*)PvAlloc(NUM_FSM_STATES * NUM_FSM_INPUTS * sizeof(CBiDiFSMCell), 0); if (!pCell) return FALSE; // unable to create FSM! 
_pStart = pCell; CBiDiLevel lvlZero = {0,0}; CBiDiLevel lvlOne = {1,0}; CBiDiLevel lvlTwo = {2,0}; CBiDiLevel lvlTwoStart = {2,1}; // State A(0): LTR char in LTR para // for (i=0; i < NUM_FSM_INPUTS; i++, pCell++) { switch (i) { case chLTR: SetFSMCell(pCell, &lvlZero, 0); break; case chRTL: SetFSMCell(pCell, &lvlOne, S_B * NUM_FSM_INPUTS); break; case digitLTR: SetFSMCell(pCell, &lvlZero, 0); break; case digitRTL: SetFSMCell(pCell, &lvlTwo, S_C * NUM_FSM_INPUTS); break; case chGround: SetFSMCell(pCell, &lvlZero, 0); break; } } // State B(1): RTL char in LTR para // for (i=0; i < NUM_FSM_INPUTS; i++, pCell++) { switch (i) { case chLTR: SetFSMCell(pCell, &lvlZero, 0); break; case chRTL: SetFSMCell(pCell, &lvlOne, S_B * NUM_FSM_INPUTS); break; case digitLTR: SetFSMCell(pCell, &lvlZero, 0); break; case digitRTL: SetFSMCell(pCell, &lvlTwo, S_C * NUM_FSM_INPUTS); break; case chGround: SetFSMCell(pCell, &lvlZero, 0); break; } } // State C(2): RTL number run in LTR para // for (i=0; i < NUM_FSM_INPUTS; i++, pCell++) { switch (i) { case chLTR: SetFSMCell(pCell, &lvlZero, 0); break; case chRTL: SetFSMCell(pCell, &lvlOne, S_B * NUM_FSM_INPUTS); break; case digitLTR: SetFSMCell(pCell, &lvlZero, 0); break; case digitRTL: SetFSMCell(pCell, &lvlTwo, S_C * NUM_FSM_INPUTS); break; case chGround: SetFSMCell(pCell, &lvlZero, 0); break; } } // State X(1): RTL char in RTL para // for (i=0; i < NUM_FSM_INPUTS; i++, pCell++) { switch (i) { case chLTR: SetFSMCell(pCell, &lvlTwo, S_Y * NUM_FSM_INPUTS); break; case chRTL: SetFSMCell(pCell, &lvlOne, S_X * NUM_FSM_INPUTS); break; case digitLTR: SetFSMCell(pCell, &lvlTwo, S_Y * NUM_FSM_INPUTS); break; case digitRTL: SetFSMCell(pCell, &lvlTwo, S_Z * NUM_FSM_INPUTS); break; case chGround: SetFSMCell(pCell, &lvlOne, S_X * NUM_FSM_INPUTS); break; } } // State Y(2): LTR char in RTL para // for (i=0; i < NUM_FSM_INPUTS; i++, pCell++) { switch (i) { case chLTR: SetFSMCell(pCell, &lvlTwo, S_Y * NUM_FSM_INPUTS); break; case chRTL: SetFSMCell(pCell, 
&lvlOne, S_X * NUM_FSM_INPUTS); break; case digitLTR: SetFSMCell(pCell, &lvlTwo, S_Y * NUM_FSM_INPUTS); break; case digitRTL: SetFSMCell(pCell, &lvlTwoStart, S_Z * NUM_FSM_INPUTS); break; case chGround: SetFSMCell(pCell, &lvlOne, S_X * NUM_FSM_INPUTS); break; } } // State Z(2): RTL number in RTL para // for (i=0; i < NUM_FSM_INPUTS; i++, pCell++) { switch (i) { case chLTR: SetFSMCell(pCell, &lvlTwoStart, S_Y * NUM_FSM_INPUTS); break; case chRTL: SetFSMCell(pCell, &lvlOne, S_X * NUM_FSM_INPUTS); break; case digitLTR: SetFSMCell(pCell, &lvlTwoStart, S_Y * NUM_FSM_INPUTS); break; case digitRTL: SetFSMCell(pCell, &lvlTwo, S_Z * NUM_FSM_INPUTS); break; case chGround: SetFSMCell(pCell, &lvlOne, S_X * NUM_FSM_INPUTS); break; } } AssertSz(&pCell[-(NUM_FSM_STATES * NUM_FSM_INPUTS)] == _pStart, "Bidi FSM incomplete constructed!"); return TRUE; } /////// CCallbackBufferBase class implementation // void* CBufferBase::GetPtr(int cel) { if (_cElem < cel) { cel += celAdvance; _p = PvReAlloc(_p, cel * _cbElem); if (!_p) return NULL; ZeroMemory(_p, cel * _cbElem); _cElem = cel; } return _p; } void CBufferBase::Release() { if (_p) FreePv(_p); } #endif // NOCOMPLEXSCRIPTS