mirror of
https://github.com/mozilla/gecko-dev.git
synced 2024-12-11 16:32:59 +00:00
605 lines
18 KiB
C++
605 lines
18 KiB
C++
/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*-
|
|
*
|
|
* The contents of this file are subject to the Netscape Public
|
|
* License Version 1.1 (the "License"); you may not use this file
|
|
* except in compliance with the License. You may obtain a copy of
|
|
* the License at http://www.mozilla.org/NPL/
|
|
*
|
|
* Software distributed under the License is distributed on an "AS
|
|
* IS" basis, WITHOUT WARRANTY OF ANY KIND, either express or
|
|
* implied. See the License for the specific language governing
|
|
* rights and limitations under the License.
|
|
*
|
|
* The Original Code is mozilla.org code.
|
|
*
|
|
* The Initial Developer of the Original Code is Netscape
|
|
* Communications Corporation. Portions created by Netscape are
|
|
* Copyright (C) 1998 Netscape Communications Corporation. All
|
|
* Rights Reserved.
|
|
*
|
|
* Contributor(s):
|
|
*/
|
|
#include <iostream.h>
|
|
#include "nsIComponentManager.h"
|
|
#include "nsISupports.h"
|
|
#include "nsIServiceManager.h"
|
|
#include "nsILineBreakerFactory.h"
|
|
#include "nsILineBreaker.h"
|
|
#include "nsIWordBreakerFactory.h"
|
|
#include "nsIWordBreaker.h"
|
|
#include "nsIBreakState.h"
|
|
#include "nsLWBrkCIID.h"
|
|
|
|
#define WORK_AROUND_SERVICE_MANAGER_ASSERT
|
|
|
|
IMPL_NS_IBREAKSTATE( nsBreakState )
|
|
|
|
NS_DEFINE_CID(kLWBrkCID, NS_LWBRK_CID);
|
|
NS_DEFINE_IID(kILineBreakerFactory, NS_ILINEBREAKERFACTORY_IID);
|
|
NS_DEFINE_IID(kIWordBreakerFactory, NS_IWORDBREAKERFACTORY_IID);
|
|
|
|
|
|
static char teng1[] =
|
|
// 1 2 3 4 5 6 7
|
|
//01234567890123456789012345678901234567890123456789012345678901234567890123456789
|
|
"This is a test to test(reasonable) line break. This 0.01123 = 45 x 48.";
|
|
|
|
static PRUint32 exp1[] = {
|
|
4,5,7,8,9,10,14,15,17,18,22,34,35,39,40,41,42,43,49,50,54,55,62,63,64,65,
|
|
67,68,69,70
|
|
};
|
|
|
|
static PRUint32 wexp1[] = {
|
|
|
|
4,5,7,8,9,10,14,15,17,18,22,23,33,34,35,39,43,48,49,50,54,55,56,57,62,63,
|
|
64,65,67,68,69,70,72
|
|
};
|
|
// 1 2 3 4 5 6 7
|
|
//01234567890123456789012345678901234567890123456789012345678901234567890123456789
|
|
static char teng2[] =
|
|
"()((reasonab(l)e) line break. .01123=45x48.";
|
|
|
|
static PRUint32 exp2[] = {
|
|
2,12,15,17,18,22,23,24,30,31,37,38,
|
|
};
|
|
static PRUint32 wexp2[] = {
|
|
4,12,13,14,15,16,17,18,22,24,29,30,31,32,37,38,43
|
|
};
|
|
|
|
// 1 2 3 4 5 6 7
|
|
//01234567890123456789012345678901234567890123456789012345678901234567890123456789
|
|
static char teng3[] =
|
|
"It's a test to test(ronae ) line break....";
|
|
static PRUint32 exp3[] = {
|
|
4, 5, 6,7,11,12,14,15,19,25,27,28,32,33
|
|
};
|
|
static PRUint32 wexp3[] = {
|
|
4,5,6,7,11,12,14,15,19,20,25,26,27,28,32,33,38
|
|
};
|
|
|
|
static char ruler1[] =
|
|
" 1 2 3 4 5 6 7 ";
|
|
static char ruler2[] =
|
|
"0123456789012345678901234567890123456789012345678901234567890123456789012";
|
|
|
|
|
|
PRBool TestASCIILB(nsILineBreaker *lb,
|
|
const char* in, const PRUint32 len,
|
|
const PRUint32* out, PRUint32 outlen)
|
|
{
|
|
nsAutoString eng1; eng1.AssignWithConversion(in);
|
|
PRUint32 i,j;
|
|
PRUint32 res[256];
|
|
PRBool ok = PR_TRUE;
|
|
PRUint32 curr;
|
|
PRBool finishThisFrag = PR_FALSE;
|
|
for(i = 0, curr = 0; ((! finishThisFrag) && (i < 256)); i++)
|
|
{
|
|
lb->Next(eng1.GetUnicode(), eng1.Length(), curr,
|
|
&curr,
|
|
&finishThisFrag);
|
|
res [i] = curr;
|
|
|
|
}
|
|
if (i != outlen)
|
|
{
|
|
ok = PR_FALSE;
|
|
cout << "WARNING!!! return size wrong, expect " << outlen <<
|
|
" bet got " << i << "\n";
|
|
}
|
|
cout << "string = \n" << in << "\n";
|
|
cout << ruler1 << "\n";
|
|
cout << ruler2 << "\n";
|
|
cout << "Expect = \n";
|
|
for(j=0;j<outlen;j++)
|
|
{
|
|
cout << out[j] << ",";
|
|
}
|
|
cout << "\nResult = \n";
|
|
for(j=0;j<i;j++)
|
|
{
|
|
cout << res[j] << ",";
|
|
}
|
|
cout << "\n";
|
|
for(j=0;j<i;j++)
|
|
{
|
|
if(j < outlen)
|
|
{
|
|
if (res[j] != out[j])
|
|
{
|
|
ok = PR_FALSE;
|
|
cout << "[" << j << "] expect " << out[j] << " but got " <<
|
|
res[j] << "\n";
|
|
}
|
|
} else {
|
|
ok = PR_FALSE;
|
|
cout << "[" << j << "] additional " <<
|
|
res[j] << "\n";
|
|
|
|
}
|
|
}
|
|
return ok;
|
|
}
|
|
|
|
PRBool TestASCIIWB(nsIWordBreaker *lb,
|
|
const char* in, const PRUint32 len,
|
|
const PRUint32* out, PRUint32 outlen)
|
|
{
|
|
nsAutoString eng1; eng1.AssignWithConversion(in);
|
|
// nsBreakState bk(eng1.GetUnicode(), eng1.Length());
|
|
|
|
PRUint32 i,j;
|
|
PRUint32 res[256];
|
|
PRBool ok = PR_TRUE;
|
|
PRBool done;
|
|
PRUint32 curr =0;
|
|
|
|
for(i = 0, lb->Next(eng1.GetUnicode(), eng1.Length(), curr, &curr, &done);
|
|
(! done ) && (i < 256);
|
|
lb->Next(eng1.GetUnicode(), eng1.Length(), curr, &curr, &done), i++)
|
|
{
|
|
res [i] = curr;
|
|
}
|
|
if (i != outlen)
|
|
{
|
|
ok = PR_FALSE;
|
|
cout << "WARNING!!! return size wrong, expect " << outlen <<
|
|
" bet got " << i << "\n";
|
|
}
|
|
cout << "string = \n" << in << "\n";
|
|
cout << ruler1 << "\n";
|
|
cout << ruler2 << "\n";
|
|
cout << "Expect = \n";
|
|
for(j=0;j<outlen;j++)
|
|
{
|
|
cout << out[j] << ",";
|
|
}
|
|
cout << "\nResult = \n";
|
|
for(j=0;j<i;j++)
|
|
{
|
|
cout << res[j] << ",";
|
|
}
|
|
cout << "\n";
|
|
for(j=0;j<i;j++)
|
|
{
|
|
if(j < outlen)
|
|
{
|
|
if (res[j] != out[j])
|
|
{
|
|
ok = PR_FALSE;
|
|
cout << "[" << j << "] expect " << out[j] << " but got " <<
|
|
res[j] << "\n";
|
|
}
|
|
} else {
|
|
ok = PR_FALSE;
|
|
cout << "[" << j << "] additional " <<
|
|
res[j] << "\n";
|
|
|
|
}
|
|
}
|
|
return ok;
|
|
}
|
|
|
|
|
|
PRBool TestLineBreaker()
|
|
{
|
|
cout << "==================================\n";
|
|
cout << "Finish nsILineBreakerFactory Test \n";
|
|
cout << "==================================\n";
|
|
nsILineBreakerFactory *t = NULL;
|
|
nsresult res;
|
|
PRBool ok = PR_TRUE;
|
|
res = nsServiceManager::GetService(kLWBrkCID,
|
|
kILineBreakerFactory,
|
|
(nsISupports**) &t);
|
|
|
|
cout << "Test 1 - GetService():\n";
|
|
if(NS_FAILED(res) || ( t == NULL ) ) {
|
|
cout << "\t1st GetService failed\n";
|
|
ok = PR_FALSE;
|
|
} else {
|
|
#ifdef WORD_AROUND_SERVICE_MANAGER_ASSERT
|
|
res = nsServiceManager::ReleaseService(kLWBrkCID, t);
|
|
#endif
|
|
}
|
|
|
|
res = nsServiceManager::GetService(kLWBrkCID,
|
|
kILineBreakerFactory,
|
|
(nsISupports**) &t);
|
|
|
|
if(NS_FAILED(res) || ( t == NULL ) ) {
|
|
cout << "\t2nd GetService failed\n";
|
|
ok = PR_FALSE;
|
|
} else {
|
|
|
|
cout << "Test 3 - GetLineBreaker():\n";
|
|
nsILineBreaker *lb;
|
|
|
|
nsAutoString lb_arg;
|
|
res = t->GetBreaker(lb_arg, &lb);
|
|
if(NS_FAILED(res) || (lb == NULL)) {
|
|
cout << "GetBreaker(nsILineBreaker*) failed\n";
|
|
ok = PR_FALSE;
|
|
} else {
|
|
|
|
cout << "Test 4 - {First,Next}ForwardBreak():\n";
|
|
if( TestASCIILB(lb, teng1, sizeof(teng1)/sizeof(char),
|
|
exp1, sizeof(exp1)/sizeof(PRUint32)) )
|
|
{
|
|
cout << "Test 4 Passed\n\n";
|
|
} else {
|
|
ok = PR_FALSE;
|
|
cout << "Test 4 Failed\n\n";
|
|
}
|
|
|
|
cout << "Test 5 - {First,Next}ForwardBreak():\n";
|
|
if(TestASCIILB(lb, teng2, sizeof(teng2)/sizeof(char),
|
|
exp2, sizeof(exp2)/sizeof(PRUint32)) )
|
|
{
|
|
cout << "Test 5 Passed\n\n";
|
|
} else {
|
|
ok = PR_FALSE;
|
|
cout << "Test 5 Failed\n\n";
|
|
}
|
|
|
|
cout << "Test 6 - {First,Next}ForwardBreak():\n";
|
|
if(TestASCIILB(lb, teng3, sizeof(teng3)/sizeof(char),
|
|
exp3, sizeof(exp3)/sizeof(PRUint32)) )
|
|
{
|
|
cout << "Test 6 Passed\n\n";
|
|
} else {
|
|
ok = PR_FALSE;
|
|
cout << "Test 6 Failed\n\n";
|
|
}
|
|
|
|
|
|
NS_IF_RELEASE(lb);
|
|
}
|
|
|
|
#ifdef WORD_AROUND_SERVICE_MANAGER_ASSERT
|
|
res = nsServiceManager::ReleaseService(kLWBrkCID, t);
|
|
#endif
|
|
}
|
|
cout << "==================================\n";
|
|
cout << "Finish nsILineBreakerFactory Test \n";
|
|
cout << "==================================\n";
|
|
|
|
return ok;
|
|
}
|
|
|
|
PRBool TestWordBreaker()
|
|
{
|
|
cout << "==================================\n";
|
|
cout << "Finish nsIWordBreakerFactory Test \n";
|
|
cout << "==================================\n";
|
|
nsIWordBreakerFactory *t = NULL;
|
|
nsresult res;
|
|
PRBool ok = PR_TRUE;
|
|
res = nsServiceManager::GetService(kLWBrkCID,
|
|
kIWordBreakerFactory,
|
|
(nsISupports**) &t);
|
|
|
|
cout << "Test 1 - GetService():\n";
|
|
if(NS_FAILED(res) || ( t == NULL ) ) {
|
|
cout << "\t1st GetService failed\n";
|
|
ok = PR_FALSE;
|
|
} else {
|
|
res = nsServiceManager::ReleaseService(kLWBrkCID, t);
|
|
}
|
|
|
|
res = nsServiceManager::GetService(kLWBrkCID,
|
|
kIWordBreakerFactory,
|
|
(nsISupports**) &t);
|
|
|
|
if(NS_FAILED(res) || ( t == NULL ) ) {
|
|
cout << "\t2nd GetService failed\n";
|
|
ok = PR_FALSE;
|
|
} else {
|
|
|
|
cout << "Test 3 - GetWordBreaker():\n";
|
|
nsIWordBreaker *lb;
|
|
|
|
nsAutoString lb_arg;
|
|
res = t->GetBreaker(lb_arg, &lb);
|
|
if(NS_FAILED(res) || (lb == NULL)) {
|
|
cout << "GetBreaker(nsIWordBreaker*) failed\n";
|
|
ok = PR_FALSE;
|
|
} else {
|
|
|
|
cout << "Test 4 - {First,Next}ForwardBreak():\n";
|
|
if( TestASCIIWB(lb, teng1, sizeof(teng1)/sizeof(char),
|
|
wexp1, sizeof(wexp1)/sizeof(PRUint32)) )
|
|
{
|
|
cout << "Test 4 Passed\n\n";
|
|
} else {
|
|
ok = PR_FALSE;
|
|
cout << "Test 4 Failed\n\n";
|
|
}
|
|
|
|
cout << "Test 5 - {First,Next}ForwardBreak():\n";
|
|
if(TestASCIIWB(lb, teng2, sizeof(teng2)/sizeof(char),
|
|
wexp2, sizeof(wexp2)/sizeof(PRUint32)) )
|
|
{
|
|
cout << "Test 5 Passed\n\n";
|
|
} else {
|
|
ok = PR_FALSE;
|
|
cout << "Test 5 Failed\n\n";
|
|
}
|
|
|
|
cout << "Test 6 - {First,Next}ForwardBreak():\n";
|
|
if(TestASCIIWB(lb, teng3, sizeof(teng3)/sizeof(char),
|
|
wexp3, sizeof(wexp3)/sizeof(PRUint32)) )
|
|
{
|
|
cout << "Test 6 Passed\n\n";
|
|
} else {
|
|
ok = PR_FALSE;
|
|
cout << "Test 6 Failed\n\n";
|
|
}
|
|
|
|
|
|
NS_IF_RELEASE(lb);
|
|
}
|
|
|
|
res = nsServiceManager::ReleaseService(kLWBrkCID, t);
|
|
}
|
|
cout << "==================================\n";
|
|
cout << "Finish nsIWordBreakerFactory Test \n";
|
|
cout << "==================================\n";
|
|
|
|
return ok;
|
|
}
|
|
|
|
#ifdef XP_PC
|
|
#define LWBRK_DLL "lwbrk.dll"
|
|
#else
|
|
#ifdef XP_MAC
|
|
#define LWBRK_DLL "LWBRK_DLL"
|
|
#else
|
|
#endif
|
|
#define LWBRK_DLL "liblwbrk"MOZ_DLL_SUFFIX
|
|
#endif
|
|
|
|
extern "C" void NS_SetupRegistry()
|
|
{
|
|
nsComponentManager::RegisterComponent(kLWBrkCID, NULL, NULL, LWBRK_DLL, PR_FALSE, PR_FALSE);
|
|
}
|
|
|
|
void SamplePrintWordWithBreak();
|
|
void SampleFindWordBreakFromPosition(PRUint32 fragN, PRUint32 offset);
|
|
// Sample Code
|
|
|
|
// 012345678901234
|
|
static const char wb0[] = "T";
|
|
static const char wb1[] = "h";
|
|
static const char wb2[] = "is is a int";
|
|
static const char wb3[] = "ernationali";
|
|
static const char wb4[] = "zation work.";
|
|
|
|
static const char* wb[] = {wb0,wb1,wb2,wb3,wb4};
|
|
void SampleWordBreakUsage()
|
|
{
|
|
SamplePrintWordWithBreak();
|
|
SampleFindWordBreakFromPosition(0,0); // This
|
|
SampleFindWordBreakFromPosition(1,0); // This
|
|
SampleFindWordBreakFromPosition(2,0); // This
|
|
SampleFindWordBreakFromPosition(2,1); // This
|
|
SampleFindWordBreakFromPosition(2,9); // [space]
|
|
SampleFindWordBreakFromPosition(2,10); // internationalization
|
|
SampleFindWordBreakFromPosition(3,4); // internationalization
|
|
SampleFindWordBreakFromPosition(3,8); // internationalization
|
|
SampleFindWordBreakFromPosition(4,6); // [space]
|
|
SampleFindWordBreakFromPosition(4,7); // work
|
|
}
|
|
|
|
|
|
void SamplePrintWordWithBreak()
|
|
{
|
|
PRUint32 numOfFragment = sizeof(wb) / sizeof(char*);
|
|
nsIWordBreakerFactory *t = NULL;
|
|
|
|
nsresult res = nsServiceManager::GetService(kLWBrkCID,
|
|
kIWordBreakerFactory,
|
|
(nsISupports**) &t);
|
|
nsIWordBreaker *wbk;
|
|
|
|
nsAutoString wb_arg;
|
|
res = t->GetBreaker(wb_arg, &wbk);
|
|
|
|
nsAutoString result;
|
|
nsAutoString tmp;
|
|
|
|
for(PRUint32 i = 0; i < numOfFragment; i++)
|
|
{
|
|
nsAutoString fragText; fragText.AssignWithConversion(wb[i]);
|
|
// nsBreakState bk(fragText.GetUnicode(), fragText.Length());
|
|
|
|
PRUint32 cur = 0;
|
|
PRBool done;
|
|
res = wbk->Next(fragText.GetUnicode(), fragText.Length(), cur, &cur, &done);
|
|
PRUint32 start = 0;
|
|
for(PRUint32 j = 0; ! done ; j++)
|
|
{
|
|
tmp.SetLength(0);
|
|
fragText.Mid(tmp, start, cur - start);
|
|
result.Append(tmp);
|
|
result.AppendWithConversion("^");
|
|
start = cur;
|
|
wbk->Next(fragText.GetUnicode(), fragText.Length(), cur, &cur, &done);
|
|
}
|
|
|
|
tmp.SetLength(0);
|
|
fragText.Mid(tmp, start, fragText.Length() - start);
|
|
result.Append(tmp);
|
|
|
|
|
|
if( i != (numOfFragment -1 ))
|
|
{
|
|
nsAutoString nextFragText; nextFragText.AssignWithConversion(wb[i+1]);
|
|
|
|
PRBool canBreak = PR_TRUE;
|
|
res = wbk->BreakInBetween( fragText.GetUnicode(),
|
|
fragText.Length(),
|
|
nextFragText.GetUnicode(),
|
|
nextFragText.Length(),
|
|
&canBreak
|
|
);
|
|
if(canBreak)
|
|
result.AppendWithConversion("^");
|
|
|
|
fragText = nextFragText;
|
|
}
|
|
}
|
|
cout << "Output From SamplePrintWordWithBreak() \n\n";
|
|
cout << "[" << result.ToNewCString() << "]\n";
|
|
}
|
|
|
|
void SampleFindWordBreakFromPosition(PRUint32 fragN, PRUint32 offset)
|
|
{
|
|
PRUint32 numOfFragment = sizeof(wb) / sizeof(char*);
|
|
nsIWordBreakerFactory *t = NULL;
|
|
|
|
nsresult res = nsServiceManager::GetService(kLWBrkCID,
|
|
kIWordBreakerFactory,
|
|
(nsISupports**) &t);
|
|
nsIWordBreaker *wbk;
|
|
|
|
nsAutoString wb_arg;
|
|
res = t->GetBreaker(wb_arg, &wbk);
|
|
|
|
|
|
nsAutoString fragText; fragText.AssignWithConversion(wb[fragN]);
|
|
|
|
PRUint32 begin, end;
|
|
|
|
|
|
nsAutoString result;
|
|
res = wbk->FindWord(fragText.GetUnicode(), fragText.Length(),
|
|
offset, &begin, &end);
|
|
|
|
PRBool canbreak;
|
|
fragText.Mid(result, begin, end-begin);
|
|
|
|
if((PRUint32)fragText.Length() == end) // if we hit the end of the fragment
|
|
{
|
|
nsAutoString curFragText = fragText;
|
|
for(PRUint32 p = fragN +1; p < numOfFragment ;p++)
|
|
{
|
|
nsAutoString nextFragText; nextFragText.AssignWithConversion(wb[p]);
|
|
res = wbk->BreakInBetween(curFragText.GetUnicode(),
|
|
curFragText.Length(),
|
|
nextFragText.GetUnicode(),
|
|
nextFragText.Length(),
|
|
&canbreak);
|
|
if(canbreak)
|
|
break;
|
|
|
|
PRUint32 b, e;
|
|
res = wbk->FindWord(nextFragText.GetUnicode(), nextFragText.Length(),
|
|
0, &b, &e);
|
|
|
|
nsAutoString tmp;
|
|
nextFragText.Mid(tmp,b,e-b);
|
|
result.Append(tmp);
|
|
|
|
if((PRUint32)nextFragText.Length() != e)
|
|
break;
|
|
|
|
nextFragText = curFragText;
|
|
}
|
|
}
|
|
|
|
if(0 == begin) // if we hit the beginning of the fragment
|
|
{
|
|
nsAutoString curFragText = fragText;
|
|
for(PRUint32 p = fragN ; p > 0 ;p--)
|
|
{
|
|
nsAutoString prevFragText; prevFragText.AssignWithConversion(wb[p-1]);
|
|
res = wbk->BreakInBetween(prevFragText.GetUnicode(),
|
|
prevFragText.Length(),
|
|
curFragText.GetUnicode(),
|
|
curFragText.Length(),
|
|
&canbreak);
|
|
if(canbreak)
|
|
break;
|
|
|
|
PRUint32 b, e;
|
|
res = wbk->FindWord(prevFragText.GetUnicode(), prevFragText.Length(),
|
|
prevFragText.Length(), &b, &e);
|
|
|
|
nsAutoString tmp;
|
|
prevFragText.Mid(tmp,b,e-b);
|
|
result.Insert(tmp,0);
|
|
|
|
if(0 != b)
|
|
break;
|
|
|
|
prevFragText = curFragText;
|
|
}
|
|
}
|
|
|
|
cout << "Output From SamplePrintWordWithBreak() \n\n";
|
|
cout << "[" << result.ToNewCString() << "]\n";
|
|
}
|
|
|
|
// Main
|
|
|
|
int main(int argc, char** argv) {
|
|
|
|
NS_SetupRegistry();
|
|
|
|
// --------------------------------------------
|
|
cout << "Test Line Break\n";
|
|
|
|
PRBool lbok ;
|
|
PRBool wbok ;
|
|
lbok =TestWordBreaker();
|
|
if(lbok)
|
|
cout << "Line Break Test\nOK\n";
|
|
else
|
|
cout << "Line Break Test\nFailed\n";
|
|
|
|
wbok = TestLineBreaker();
|
|
if(wbok)
|
|
cout << "Word Break Test\nOK\n";
|
|
else
|
|
cout << "Word Break Test\nFailed\n";
|
|
|
|
SampleWordBreakUsage();
|
|
|
|
|
|
// --------------------------------------------
|
|
cout << "Finish All The Test Cases\n";
|
|
nsresult res = NS_OK;
|
|
res = nsComponentManager::FreeLibraries();
|
|
|
|
if(NS_FAILED(res))
|
|
cout << "nsComponentManager failed\n";
|
|
else
|
|
cout << "nsComponentManager FreeLibraries Done\n";
|
|
if(lbok && wbok)
|
|
cout << "Line/Word Break Test\nOK\n";
|
|
else
|
|
cout << "Line/Word Break Test\nFailed\n";
|
|
return 0;
|
|
}
|