2008-09-30 17:50:42 -07:00
|
|
|
/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
|
2012-05-21 04:12:37 -07:00
|
|
|
/* This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
|
2007-03-22 10:30:00 -07:00
|
|
|
|
|
|
|
#ifndef nsUnicharUtils_h__
|
|
|
|
#define nsUnicharUtils_h__
|
|
|
|
|
|
|
|
#include "nsStringGlue.h"
|
|
|
|
|
|
|
|
/*
 * IS_CJ_CHAR(u) evaluates to true when |u| falls inside one of the four
 * inclusive ranges tested below:
 *
 *   0x2e80 .. 0x312f
 *   0x3190 .. 0xabff
 *   0xf900 .. 0xfaff
 *   0xff00 .. 0xffef
 *
 * The following Hangul ranges are NOT matched by the macro:
 *
 *   (0x3131u <= (u) && (u) <= 0x318eu) => Hangul Compatibility Jamo
 *   (0xac00u <= (u) && (u) <= 0xd7a3u) => Hangul Syllables
 *
 * NOTE: |u| is expanded several times, so do not pass an expression that
 * has side effects (e.g. IS_CJ_CHAR(*p++)).
 */
#define IS_CJ_CHAR(u) \
  ((0x2e80u <= (u) && (u) <= 0x312fu) || \
   (0x3190u <= (u) && (u) <= 0xabffu) || \
   (0xf900u <= (u) && (u) <= 0xfaffu) || \
   (0xff00u <= (u) && (u) <= 0xffefu))
|
|
|
|
|
|
|
|
void ToLowerCase(nsAString&);
|
|
|
|
void ToUpperCase(nsAString&);
|
|
|
|
|
|
|
|
// Two-argument case conversion: aSource is read-only and aDest is the
// writable output string (presumably receiving the converted copy of
// aSource; the implementation is not visible in this header).
void ToLowerCase(const nsAString& aSource,
                 nsAString& aDest);
void ToUpperCase(const nsAString& aSource,
                 nsAString& aDest);
|
|
|
|
|
2012-08-22 08:56:38 -07:00
|
|
|
// Case mappings on a single 32-bit value (presumably a Unicode code point --
// confirm against the implementation). Each returns the mapped value.
uint32_t ToLowerCase(uint32_t aChar);
uint32_t ToUpperCase(uint32_t aChar);
uint32_t ToTitleCase(uint32_t aChar);
|
2010-07-29 12:22:16 -07:00
|
|
|
|
2012-08-22 08:56:38 -07:00
|
|
|
// Raw-buffer case conversion. The arguments are a read-only PRUnichar
// buffer, a writable PRUnichar buffer and a 32-bit count.
// NOTE(review): presumably (source, destination, length in PRUnichar units);
// confirm against the implementation.
void ToLowerCase(const PRUnichar*,
                 PRUnichar*,
                 uint32_t);
void ToUpperCase(const PRUnichar*,
                 PRUnichar*,
                 uint32_t);
|
2007-03-22 10:30:00 -07:00
|
|
|
|
2012-08-22 08:56:38 -07:00
|
|
|
inline bool IsUpperCase(uint32_t c) {
|
2007-03-22 10:30:00 -07:00
|
|
|
return ToLowerCase(c) != c;
|
|
|
|
}
|
|
|
|
|
2012-08-22 08:56:38 -07:00
|
|
|
inline bool IsLowerCase(uint32_t c) {
|
2007-03-22 10:30:00 -07:00
|
|
|
return ToUpperCase(c) != c;
|
|
|
|
}
|
|
|
|
|
|
|
|
#ifdef MOZILLA_INTERNAL_API
|
|
|
|
|
|
|
|
class nsCaseInsensitiveStringComparator : public nsStringComparator
|
|
|
|
{
|
|
|
|
public:
|
2012-08-22 08:56:38 -07:00
|
|
|
virtual int32_t operator() (const PRUnichar*,
|
2010-07-29 12:22:16 -07:00
|
|
|
const PRUnichar*,
|
2012-08-22 08:56:38 -07:00
|
|
|
uint32_t,
|
|
|
|
uint32_t) const;
|
2010-08-31 18:03:40 -07:00
|
|
|
};
|
|
|
|
|
|
|
|
class nsCaseInsensitiveUTF8StringComparator : public nsCStringComparator
|
|
|
|
{
|
|
|
|
public:
|
2012-08-22 08:56:38 -07:00
|
|
|
virtual int32_t operator() (const char*,
|
2010-08-31 18:03:40 -07:00
|
|
|
const char*,
|
2012-08-22 08:56:38 -07:00
|
|
|
uint32_t,
|
|
|
|
uint32_t) const;
|
2007-03-22 10:30:00 -07:00
|
|
|
};
|
|
|
|
|
2008-09-30 17:50:42 -07:00
|
|
|
class nsCaseInsensitiveStringArrayComparator
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
template<class A, class B>
|
2011-09-28 23:19:26 -07:00
|
|
|
bool Equals(const A& a, const B& b) const {
|
2008-09-30 17:50:42 -07:00
|
|
|
return a.Equals(b, nsCaseInsensitiveStringComparator());
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2010-08-02 15:19:04 -07:00
|
|
|
class nsASCIICaseInsensitiveStringComparator : public nsStringComparator
|
|
|
|
{
|
|
|
|
public:
|
2011-03-24 17:01:47 -07:00
|
|
|
nsASCIICaseInsensitiveStringComparator() {}
|
2010-08-02 15:19:04 -07:00
|
|
|
virtual int operator() (const PRUnichar*,
|
|
|
|
const PRUnichar*,
|
2012-08-22 08:56:38 -07:00
|
|
|
uint32_t,
|
|
|
|
uint32_t) const;
|
2010-08-02 15:19:04 -07:00
|
|
|
};
|
|
|
|
|
2011-09-28 23:19:26 -07:00
|
|
|
inline bool
|
2007-03-22 10:30:00 -07:00
|
|
|
CaseInsensitiveFindInReadable(const nsAString& aPattern,
|
|
|
|
nsAString::const_iterator& aSearchStart,
|
|
|
|
nsAString::const_iterator& aSearchEnd)
|
|
|
|
{
|
|
|
|
return FindInReadable(aPattern, aSearchStart, aSearchEnd,
|
|
|
|
nsCaseInsensitiveStringComparator());
|
|
|
|
}
|
|
|
|
|
2011-09-28 23:19:26 -07:00
|
|
|
inline bool
|
2007-03-22 10:30:00 -07:00
|
|
|
CaseInsensitiveFindInReadable(const nsAString& aPattern,
|
|
|
|
const nsAString& aHay)
|
|
|
|
{
|
|
|
|
nsAString::const_iterator searchBegin, searchEnd;
|
|
|
|
return FindInReadable(aPattern, aHay.BeginReading(searchBegin),
|
|
|
|
aHay.EndReading(searchEnd),
|
|
|
|
nsCaseInsensitiveStringComparator());
|
|
|
|
}
|
|
|
|
|
2010-07-29 12:22:16 -07:00
|
|
|
#endif // MOZILLA_INTERNAL_API
|
2010-07-04 06:27:16 -07:00
|
|
|
|
2012-08-22 08:56:38 -07:00
|
|
|
int32_t
|
|
|
|
CaseInsensitiveCompare(const PRUnichar *a, const PRUnichar *b, uint32_t len);
|
2010-07-04 06:27:16 -07:00
|
|
|
|
2012-08-22 08:56:38 -07:00
|
|
|
// Case-insensitive comparison of two char buffers. aLeftBytes and
// aRightBytes give the sizes, in bytes, of aLeft and aRight respectively.
// NOTE(review): the buffers are presumably UTF-8, as in
// CaseInsensitiveUTF8CharsEqual() -- confirm against the implementation.
int32_t CaseInsensitiveCompare(const char* aLeft,
                               const char* aRight,
                               uint32_t aLeftBytes,
                               uint32_t aRightBytes);
|
2010-08-31 18:03:40 -07:00
|
|
|
|
|
|
|
/**
 * Tests whether the UTF-8 sequence starting at aLeft and the UTF-8 sequence
 * starting at aRight are equal when case is ignored.
 *
 * aLeftEnd is the first address past aLeft that no longer belongs to aLeft;
 * aRightEnd plays the same role for aRight.
 *
 * Preconditions: aLeft < aLeftEnd and aRight < aRightEnd.
 *
 * On return, *aLeftNext and *aRightNext hold the addresses of the next
 * characters in the respective sequences. The caller must validate these
 * pointers before using them, because the function may report
 * aLeftNext >= aLeftEnd or aRightNext >= aRightEnd.
 *
 * Error handling: when invalid text is encountered, *aErr is set to true and
 * the function returns false; aLeftNext and aRightNext may then be left
 * uninitialized. Whenever the function returns true, *aErr is false and both
 * aLeftNext and aRightNext have been initialized.
 */
bool CaseInsensitiveUTF8CharsEqual(const char* aLeft,
                                   const char* aRight,
                                   const char* aLeftEnd,
                                   const char* aRightEnd,
                                   const char** aLeftNext,
                                   const char** aRightNext,
                                   bool* aErr);
|
2010-08-31 18:03:40 -07:00
|
|
|
|
2012-03-12 15:53:18 -07:00
|
|
|
namespace mozilla {

/**
 * Computes the hash of a UTF-8 string as if it were a UTF-16 string.
 *
 * The result is identical to what HashString() would return for the same
 * text after conversion to UTF-16.
 *
 * aLength is measured in bytes.
 *
 * NOTE(review): aErr is an out-parameter whose contract is not described
 * here; presumably it is set when the input is not valid UTF-8 -- confirm
 * against the implementation.
 */
uint32_t HashUTF8AsUTF16(const char* aUTF8,
                         uint32_t aLength,
                         bool* aErr);

} // namespace mozilla
|
|
|
|
|
2007-03-22 10:30:00 -07:00
|
|
|
#endif /* nsUnicharUtils_h__ */
|