mirror of
https://github.com/mozilla/gecko-dev.git
synced 2024-11-06 17:16:12 +00:00
180 lines
7.4 KiB
C++
180 lines
7.4 KiB
C++
/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*-
 * ***** BEGIN LICENSE BLOCK *****
 * Version: MPL 1.1/GPL 2.0/LGPL 2.1
 *
 * The contents of this file are subject to the Mozilla Public License Version
 * 1.1 (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 * http://www.mozilla.org/MPL/
 *
 * Software distributed under the License is distributed on an "AS IS" basis,
 * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
 * for the specific language governing rights and limitations under the
 * License.
 *
 * The Original Code is Novell code.
 *
 * The Initial Developer of the Original Code is Novell Corporation.
 * Portions created by the Initial Developer are Copyright (C) 2006
 * the Initial Developer. All Rights Reserved.
 *
 * Contributor(s):
 *   robert@ocallahan.org
 *
 * Alternatively, the contents of this file may be used under the terms of
 * either the GNU General Public License Version 2 or later (the "GPL"), or
 * the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
 * in which case the provisions of the GPL or the LGPL are applicable instead
 * of those above. If you wish to allow use of your version of this file only
 * under the terms of either the GPL or the LGPL, and not to allow others to
 * use your version of this file under the terms of the MPL, indicate your
 * decision by deleting the provisions above and replace them with the notice
 * and other provisions required by the GPL or the LGPL. If you do not delete
 * the provisions above, a recipient may use your version of this file under
 * the terms of any one of the MPL, the GPL or the LGPL.
 *
 * ***** END LICENSE BLOCK ***** */
|
|
|
|
#ifndef NSTEXTFRAMEUTILS_H_
|
|
#define NSTEXTFRAMEUTILS_H_
|
|
|
|
#include "gfxFont.h"
|
|
#include "gfxSkipChars.h"
|
|
#include "nsTextFragment.h"
|
|
|
|
// NOTE(review): presumably the length threshold above which a text node is
// treated as "big"; the macro is not referenced anywhere in this header, so
// confirm the exact meaning and unit at its use sites.
#define BIG_TEXT_NODE_SIZE 4096
|
|
|
|
class nsTextFrameUtils {
|
|
public:
|
|
// These constants are used as textrun flags for textframe textruns.
|
|
enum {
|
|
// The following flags are set by TransformText
|
|
|
|
// the text has at least one untransformed tab character
|
|
TEXT_HAS_TAB = 0x010000,
|
|
// the original text has at least one soft hyphen character
|
|
TEXT_HAS_SHY = 0x020000,
|
|
TEXT_HAS_NON_ASCII = 0x040000,
|
|
TEXT_WAS_TRANSFORMED = 0x080000,
|
|
|
|
// The following flags are set by nsTextFrame
|
|
|
|
TEXT_IS_SIMPLE_FLOW = 0x100000,
|
|
TEXT_INCOMING_WHITESPACE = 0x200000
|
|
};
|
|
|
|
static PRBool
|
|
IsPunctuationMark(PRUnichar aChar);
|
|
|
|
/**
|
|
* Returns PR_TRUE if aChars/aLength are something that make a space
|
|
* character not be whitespace when they follow the space character.
|
|
* For now, this is true if and only if aChars starts with a ZWJ. (This
|
|
* is what Uniscribe assumes.)
|
|
*/
|
|
static PRBool
|
|
IsSpaceCombiningSequenceTail(const PRUnichar* aChars, PRInt32 aLength) {
|
|
return aLength > 0 && aChars[0] == 0x200D; // ZWJ
|
|
}
|
|
|
|
/**
|
|
* Create a text run from a run of Unicode text. The text may have whitespace
|
|
* compressed. A preformatted tab is sent to the text run as a single space.
|
|
* (Tab spacing must be performed by textframe later.) Certain other
|
|
* characters are discarded.
|
|
*
|
|
* @param aCompressWhitespace runs of consecutive whitespace (spaces not
|
|
* followed by a diacritical mark, tabs, and newlines) are compressed to a
|
|
* single space character.
|
|
*/
|
|
static PRUnichar* TransformText(const PRUnichar* aText, PRUint32 aLength,
|
|
PRUnichar* aOutput,
|
|
PRBool aCompressWhitespace,
|
|
PRPackedBool* aIncomingWhitespace,
|
|
gfxSkipCharsBuilder* aSkipChars,
|
|
PRUint32* aAnalysisFlags);
|
|
|
|
static PRUint8* TransformText(const PRUint8* aText, PRUint32 aLength,
|
|
PRUint8* aOutput,
|
|
PRBool aCompressWhitespace,
|
|
PRPackedBool* aIncomingWhitespace,
|
|
gfxSkipCharsBuilder* aSkipChars,
|
|
PRUint32* aAnalysisFlags);
|
|
|
|
/**
|
|
* Find a word boundary starting from a given position and proceeding either
|
|
* forwards (aDirection == 1) or backwards (aDirection == -1). The search
|
|
* is limited to a substring of an nsTextFragment. We return the index
|
|
* of the character that is the first character of the next/prev word; the
|
|
* result can be aOffset <= result <= aLength (result == aLength means
|
|
* that there's definitely a word boundary at the end of the text), or -1 to
|
|
* indicate that no boundary was found.
|
|
*
|
|
* @param aTextRun a text run which we will use to ensure that we don't
|
|
* return a boundary inside a cluster
|
|
* @param aPosition a character in the substring aOffset/aLength
|
|
* @param aBreakBeforePunctuation if true, then we allow a word break
|
|
* when transitioning from regular word text to punctuation (in content order)
|
|
* @param aBreakAfterPunctuation if true, then we allow a word break
|
|
* when transitioning from punctuation to regular word text (in content order)
|
|
* @param aWordIsWhitespace we set this to true if the word-part we skipped
|
|
* over is whitespace
|
|
*
|
|
* For the above properties, "punctuation" is defined as any ASCII character
|
|
* which is not a letter or a digit. Regular word text is any non-whitespace
|
|
* (here "whitespace" includes non-breaking whitespace).
|
|
* Word break points are the punctuation breaks defined above, plus
|
|
* for Unicode text, whatever intl's wordbreaker identifies, and for
|
|
* ASCII text, boundaries between whitespace and non-whitespace.
|
|
*/
|
|
static PRInt32
|
|
FindWordBoundary(const nsTextFragment* aText,
|
|
gfxTextRun* aTextRun,
|
|
gfxSkipCharsIterator* aIterator,
|
|
PRInt32 aOffset, PRInt32 aLength,
|
|
PRInt32 aPosition, PRInt32 aDirection,
|
|
PRBool aBreakBeforePunctuation,
|
|
PRBool aBreakAfterPunctuation,
|
|
PRBool* aWordIsWhitespace);
|
|
};
|
|
|
|
class nsSkipCharsRunIterator {
|
|
public:
|
|
enum LengthMode {
|
|
LENGTH_UNSKIPPED_ONLY = PR_FALSE,
|
|
LENGTH_INCLUDES_SKIPPED = PR_TRUE
|
|
};
|
|
nsSkipCharsRunIterator(const gfxSkipCharsIterator& aStart,
|
|
LengthMode aLengthIncludesSkipped, PRUint32 aLength)
|
|
: mIterator(aStart), mRemainingLength(aLength), mRunLength(0),
|
|
mVisitSkipped(PR_FALSE),
|
|
mLengthIncludesSkipped(aLengthIncludesSkipped) {
|
|
}
|
|
void SetVisitSkipped() { mVisitSkipped = PR_TRUE; }
|
|
void SetOriginalOffset(PRInt32 aOffset) {
|
|
mIterator.SetOriginalOffset(aOffset);
|
|
}
|
|
void SetSkippedOffset(PRUint32 aOffset) {
|
|
mIterator.SetSkippedOffset(aOffset);
|
|
}
|
|
|
|
// guaranteed to return only positive-length runs
|
|
PRBool NextRun();
|
|
PRBool IsSkipped() const { return mSkipped; }
|
|
// Always returns something > 0
|
|
PRInt32 GetRunLength() const { return mRunLength; }
|
|
const gfxSkipCharsIterator& GetPos() const { return mIterator; }
|
|
PRInt32 GetOriginalOffset() const { return mIterator.GetOriginalOffset(); }
|
|
PRUint32 GetSkippedOffset() const { return mIterator.GetSkippedOffset(); }
|
|
|
|
private:
|
|
gfxSkipCharsIterator mIterator;
|
|
PRInt32 mRemainingLength;
|
|
PRInt32 mRunLength;
|
|
PRPackedBool mSkipped;
|
|
PRPackedBool mVisitSkipped;
|
|
PRPackedBool mLengthIncludesSkipped;
|
|
};
|
|
|
|
#endif /*NSTEXTFRAMEUTILS_H_*/
|