#ifndef TextBreakIterator_h
#define TextBreakIterator_h
#include "platform/PlatformExport.h"
#include "wtf/text/AtomicString.h"
#include "wtf/unicode/Unicode.h"
#include <unicode/brkiter.h>
namespace WebCore {
typedef icu::BreakIterator TextBreakIterator;
PLATFORM_EXPORT TextBreakIterator* cursorMovementIterator(const UChar*, int length);
PLATFORM_EXPORT TextBreakIterator* wordBreakIterator(const String&, int start, int length);
PLATFORM_EXPORT TextBreakIterator* wordBreakIterator(const UChar*, int length);
PLATFORM_EXPORT TextBreakIterator* acquireLineBreakIterator(const LChar*, int length, const AtomicString& locale, const UChar* priorContext, unsigned priorContextLength);
PLATFORM_EXPORT TextBreakIterator* acquireLineBreakIterator(const UChar*, int length, const AtomicString& locale, const UChar* priorContext, unsigned priorContextLength);
PLATFORM_EXPORT void releaseLineBreakIterator(TextBreakIterator*);
PLATFORM_EXPORT TextBreakIterator* sentenceBreakIterator(const UChar*, int length);
PLATFORM_EXPORT bool isWordTextBreak(TextBreakIterator*);
const int TextBreakDone = -1;
class PLATFORM_EXPORT LazyLineBreakIterator {
public:
LazyLineBreakIterator()
: m_iterator(0)
, m_cachedPriorContext(0)
, m_cachedPriorContextLength(0)
{
resetPriorContext();
}
LazyLineBreakIterator(String string, const AtomicString& locale = AtomicString())
: m_string(string)
, m_locale(locale)
, m_iterator(0)
, m_cachedPriorContext(0)
, m_cachedPriorContextLength(0)
{
resetPriorContext();
}
~LazyLineBreakIterator()
{
if (m_iterator)
releaseLineBreakIterator(m_iterator);
}
String string() const { return m_string; }
UChar lastCharacter() const
{
COMPILE_ASSERT(WTF_ARRAY_LENGTH(m_priorContext) == 2, TextBreakIterator_unexpected_prior_context_length);
return m_priorContext[1];
}
UChar secondToLastCharacter() const
{
COMPILE_ASSERT(WTF_ARRAY_LENGTH(m_priorContext) == 2, TextBreakIterator_unexpected_prior_context_length);
return m_priorContext[0];
}
void setPriorContext(UChar last, UChar secondToLast)
{
COMPILE_ASSERT(WTF_ARRAY_LENGTH(m_priorContext) == 2, TextBreakIterator_unexpected_prior_context_length);
m_priorContext[0] = secondToLast;
m_priorContext[1] = last;
}
void updatePriorContext(UChar last)
{
COMPILE_ASSERT(WTF_ARRAY_LENGTH(m_priorContext) == 2, TextBreakIterator_unexpected_prior_context_length);
m_priorContext[0] = m_priorContext[1];
m_priorContext[1] = last;
}
void resetPriorContext()
{
COMPILE_ASSERT(WTF_ARRAY_LENGTH(m_priorContext) == 2, TextBreakIterator_unexpected_prior_context_length);
m_priorContext[0] = 0;
m_priorContext[1] = 0;
}
unsigned priorContextLength() const
{
unsigned priorContextLength = 0;
COMPILE_ASSERT(WTF_ARRAY_LENGTH(m_priorContext) == 2, TextBreakIterator_unexpected_prior_context_length);
if (m_priorContext[1]) {
++priorContextLength;
if (m_priorContext[0])
++priorContextLength;
}
return priorContextLength;
}
TextBreakIterator* get(unsigned priorContextLength)
{
ASSERT(priorContextLength <= priorContextCapacity);
const UChar* priorContext = priorContextLength ? &m_priorContext[priorContextCapacity - priorContextLength] : 0;
if (!m_iterator) {
if (m_string.is8Bit())
m_iterator = acquireLineBreakIterator(m_string.characters8(), m_string.length(), m_locale, priorContext, priorContextLength);
else
m_iterator = acquireLineBreakIterator(m_string.characters16(), m_string.length(), m_locale, priorContext, priorContextLength);
m_cachedPriorContext = priorContext;
m_cachedPriorContextLength = priorContextLength;
} else if (priorContext != m_cachedPriorContext || priorContextLength != m_cachedPriorContextLength) {
this->resetStringAndReleaseIterator(m_string, m_locale);
return this->get(priorContextLength);
}
return m_iterator;
}
void resetStringAndReleaseIterator(String string, const AtomicString& locale)
{
if (m_iterator)
releaseLineBreakIterator(m_iterator);
m_string = string;
m_locale = locale;
m_iterator = 0;
m_cachedPriorContext = 0;
m_cachedPriorContextLength = 0;
}
private:
static const unsigned priorContextCapacity = 2;
String m_string;
AtomicString m_locale;
TextBreakIterator* m_iterator;
UChar m_priorContext[priorContextCapacity];
const UChar* m_cachedPriorContext;
unsigned m_cachedPriorContextLength;
};
class PLATFORM_EXPORT NonSharedCharacterBreakIterator {
WTF_MAKE_NONCOPYABLE(NonSharedCharacterBreakIterator);
public:
explicit NonSharedCharacterBreakIterator(const String&);
NonSharedCharacterBreakIterator(const UChar*, unsigned length);
~NonSharedCharacterBreakIterator();
int next();
int current();
bool isBreak(int offset) const;
int preceding(int offset) const;
int following(int offset) const;
bool operator!() const
{
return !m_is8Bit && !m_iterator;
}
private:
void createIteratorForBuffer(const UChar*, unsigned length);
unsigned clusterLengthStartingAt(unsigned offset) const
{
ASSERT(m_is8Bit);
return isCRBeforeLF(offset) ? 2 : 1;
}
bool isCRBeforeLF(unsigned offset) const
{
ASSERT(m_is8Bit);
return m_charaters8[offset] == '\r' && offset + 1 < m_length && m_charaters8[offset + 1] == '\n';
}
bool isLFAfterCR(unsigned offset) const
{
ASSERT(m_is8Bit);
return m_charaters8[offset] == '\n' && offset >= 1 && m_charaters8[offset - 1] == '\r';
}
bool m_is8Bit;
const LChar* m_charaters8;
unsigned m_offset;
unsigned m_length;
TextBreakIterator* m_iterator;
};
PLATFORM_EXPORT unsigned numGraphemeClusters(const String&);
PLATFORM_EXPORT unsigned numCharactersInGraphemeClusters(const String&, unsigned);
}
#endif