RetroZilla/intl/lwbrk/tests/TestLineBreak.cpp
2015-10-20 23:03:22 -04:00

581 lines
17 KiB
C++

/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
/* ***** BEGIN LICENSE BLOCK *****
* Version: MPL 1.1/GPL 2.0/LGPL 2.1
*
* The contents of this file are subject to the Mozilla Public License Version
* 1.1 (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
* http://www.mozilla.org/MPL/
*
* Software distributed under the License is distributed on an "AS IS" basis,
* WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
* for the specific language governing rights and limitations under the
* License.
*
* The Original Code is mozilla.org code.
*
* The Initial Developer of the Original Code is
* Netscape Communications Corporation.
* Portions created by the Initial Developer are Copyright (C) 1998
* the Initial Developer. All Rights Reserved.
*
* Contributor(s):
*
* Alternatively, the contents of this file may be used under the terms of
* either of the GNU General Public License Version 2 or later (the "GPL"),
* or the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
* in which case the provisions of the GPL or the LGPL are applicable instead
* of those above. If you wish to allow use of your version of this file only
* under the terms of either the GPL or the LGPL, and not to allow others to
* use your version of this file under the terms of the MPL, indicate your
* decision by deleting the provisions above and replace them with the notice
* and other provisions required by the GPL or the LGPL. If you do not delete
* the provisions above, a recipient may use your version of this file under
* the terms of any one of the MPL, the GPL or the LGPL.
*
* ***** END LICENSE BLOCK ***** */
#include <stdio.h>
#include "nsXPCOM.h"
#include "nsIComponentManager.h"
#include "nsISupports.h"
#include "nsServiceManagerUtils.h"
#include "nsILineBreakerFactory.h"
#include "nsILineBreaker.h"
#include "nsIWordBreakerFactory.h"
#include "nsIWordBreaker.h"
#include "nsIBreakState.h"
#include "nsLWBrkCIID.h"
#include "nsReadableUtils.h"
#define WORK_AROUND_SERVICE_MANAGER_ASSERT
IMPL_NS_IBREAKSTATE( nsBreakState )
NS_DEFINE_CID(kLWBrkCID, NS_LWBRK_CID);
static char teng1[] =
// 1 2 3 4 5 6 7
//01234567890123456789012345678901234567890123456789012345678901234567890123456789
"This is a test to test(reasonable) line break. This 0.01123 = 45 x 48.";
static PRUint32 exp1[] = {
4,5,7,8,9,10,14,15,17,18,22,34,35,39,40,41,42,43,49,50,54,55,62,63,64,65,
67,68,69,70
};
static PRUint32 wexp1[] = {
4,5,7,8,9,10,14,15,17,18,22,23,33,34,35,39,43,48,49,50,54,55,56,57,62,63,
64,65,67,68,69,70,72
};
// 1 2 3 4 5 6 7
//01234567890123456789012345678901234567890123456789012345678901234567890123456789
static char teng2[] =
"()((reasonab(l)e) line break. .01123=45x48.";
static PRUint32 lexp2[] = {
2,12,15,17,18,22,23,24,30,31,37,38,
};
static PRUint32 wexp2[] = {
4,12,13,14,15,16,17,18,22,24,29,30,31,32,37,38,43
};
// 1 2 3 4 5 6 7
//01234567890123456789012345678901234567890123456789012345678901234567890123456789
static char teng3[] =
"It's a test to test(ronae ) line break....";
static PRUint32 exp3[] = {
4, 5, 6,7,11,12,14,15,19,25,27,28,32,33
};
static PRUint32 wexp3[] = {
4,5,6,7,11,12,14,15,19,20,25,26,27,28,32,33,38
};
static char ruler1[] =
" 1 2 3 4 5 6 7 ";
static char ruler2[] =
"0123456789012345678901234567890123456789012345678901234567890123456789012";
PRBool TestASCIILB(nsILineBreaker *lb,
const char* in, const PRUint32 len,
const PRUint32* out, PRUint32 outlen)
{
nsAutoString eng1; eng1.AssignWithConversion(in);
PRUint32 i,j;
PRUint32 res[256];
PRBool ok = PR_TRUE;
PRUint32 curr;
PRBool finishThisFrag = PR_FALSE;
for(i = 0, curr = 0; ((! finishThisFrag) && (i < 256)); i++)
{
lb->Next(eng1.get(), eng1.Length(), curr,
&curr,
&finishThisFrag);
res [i] = curr;
}
if (i != outlen)
{
ok = PR_FALSE;
printf("WARNING!!! return size wrong, expect %d bet got %d \n",
outlen, i);
}
printf("string = \n%s\n", in);
printf("%s\n", ruler1);
printf("%s\n", ruler2);
printf("Expect = \n");
for(j=0;j<outlen;j++)
{
printf("%d,", out[j]);
}
printf("\nResult = \n");
for(j=0;j<i;j++)
{
printf("%d,", res[j]);
}
printf("\n");
for(j=0;j<i;j++)
{
if(j < outlen)
{
if (res[j] != out[j])
{
ok = PR_FALSE;
printf("[%d] expect %d but got %d\n", j, out[j], res[j]);
}
} else {
ok = PR_FALSE;
printf("[%d] additional %d\n", j, res[j]);
}
}
return ok;
}
PRBool TestASCIIWB(nsIWordBreaker *lb,
const char* in, const PRUint32 len,
const PRUint32* out, PRUint32 outlen)
{
nsAutoString eng1; eng1.AssignWithConversion(in);
// nsBreakState bk(eng1.get(), eng1.Length());
PRUint32 i,j;
PRUint32 res[256];
PRBool ok = PR_TRUE;
PRBool done;
PRUint32 curr =0;
for(i = 0, lb->NextWord(eng1.get(), eng1.Length(), curr, &curr, &done);
(! done ) && (i < 256);
lb->NextWord(eng1.get(), eng1.Length(), curr, &curr, &done), i++)
{
res [i] = curr;
}
if (i != outlen)
{
ok = PR_FALSE;
printf("WARNING!!! return size wrong, expect %d bet got %d\n",
outlen, i);
}
printf("string = \n%s\n", in);
printf("%s\n", ruler1);
printf("%s\n", ruler2);
printf("Expect = \n");
for(j=0;j<outlen;j++)
{
printf("%d,", out[j]);
}
printf("\nResult = \n");
for(j=0;j<i;j++)
{
printf("%d,", res[j]);
}
printf("\n");
for(j=0;j<i;j++)
{
if(j < outlen)
{
if (res[j] != out[j])
{
ok = PR_FALSE;
printf("[%d] expect %d but got %d\n", j, out[j], res[j]);
}
} else {
ok = PR_FALSE;
printf("[%d] additional %d\n", j, res[j]);
}
}
return ok;
}
PRBool TestLineBreaker()
{
printf("==================================\n");
printf("Finish nsILineBreakerFactory Test \n");
printf("==================================\n");
nsILineBreakerFactory *t = NULL;
nsresult res;
PRBool ok = PR_TRUE;
res = CallGetService(kLWBrkCID, &t);
printf("Test 1 - GetService():\n");
if(NS_FAILED(res) || ( t == NULL ) ) {
printf("\t1st GetService failed\n");
ok = PR_FALSE;
} else {
#ifdef WORD_AROUND_SERVICE_MANAGER_ASSERT
NS_RELEASE(t);
#endif
}
res = CallGetService(kLWBrkCID, &t);
if(NS_FAILED(res) || ( t == NULL ) ) {
printf("\t2nd GetService failed\n");
ok = PR_FALSE;
} else {
printf("Test 3 - GetLineBreaker():\n");
nsILineBreaker *lb;
nsAutoString lb_arg;
res = t->GetBreaker(lb_arg, &lb);
if(NS_FAILED(res) || (lb == NULL)) {
printf("GetBreaker(nsILineBreaker*) failed\n");
ok = PR_FALSE;
} else {
printf("Test 4 - {First,Next}ForwardBreak():\n");
if( TestASCIILB(lb, teng1, sizeof(teng1)/sizeof(char),
exp1, sizeof(exp1)/sizeof(PRUint32)) )
{
printf("Test 4 Passed\n\n");
} else {
ok = PR_FALSE;
printf("Test 4 Failed\n\n");
}
printf("Test 5 - {First,Next}ForwardBreak():\n");
if(TestASCIILB(lb, teng2, sizeof(teng2)/sizeof(char),
lexp2, sizeof(lexp2)/sizeof(PRUint32)) )
{
printf("Test 5 Passed\n\n");
} else {
ok = PR_FALSE;
printf("Test 5 Failed\n\n");
}
printf("Test 6 - {First,Next}ForwardBreak():\n");
if(TestASCIILB(lb, teng3, sizeof(teng3)/sizeof(char),
exp3, sizeof(exp3)/sizeof(PRUint32)) )
{
printf("Test 6 Passed\n\n");
} else {
ok = PR_FALSE;
printf("Test 6 Failed\n\n");
}
NS_IF_RELEASE(lb);
}
#ifdef WORD_AROUND_SERVICE_MANAGER_ASSERT
NS_RELEASE(t);
#endif
}
printf("==================================\n");
printf("Finish nsILineBreakerFactory Test \n");
printf("==================================\n");
return ok;
}
PRBool TestWordBreaker()
{
printf("==================================\n");
printf("Finish nsIWordBreakerFactory Test \n");
printf("==================================\n");
nsIWordBreakerFactory *t = NULL;
nsresult res;
PRBool ok = PR_TRUE;
res = CallGetService(kLWBrkCID, &t);
printf("Test 1 - GetService():\n");
if(NS_FAILED(res) || ( t == NULL ) ) {
printf("\t1st GetService failed\n");
ok = PR_FALSE;
} else {
NS_RELEASE(t);
}
res = CallGetService(kLWBrkCID, &t);
if(NS_FAILED(res) || ( t == NULL ) ) {
printf("\t2nd GetService failed\n");
ok = PR_FALSE;
} else {
printf("Test 3 - GetWordBreaker():\n");
nsIWordBreaker *lb;
nsAutoString lb_arg;
res = t->GetBreaker(lb_arg, &lb);
if(NS_FAILED(res) || (lb == NULL)) {
printf("GetBreaker(nsIWordBreaker*) failed\n");
ok = PR_FALSE;
} else {
printf("Test 4 - {First,Next}ForwardBreak():\n");
if( TestASCIIWB(lb, teng1, sizeof(teng1)/sizeof(char),
wexp1, sizeof(wexp1)/sizeof(PRUint32)) )
{
printf("Test 4 Passed\n\n");
} else {
ok = PR_FALSE;
printf("Test 4 Failed\n\n");
}
printf("Test 5 - {First,Next}ForwardBreak():\n");
if(TestASCIIWB(lb, teng2, sizeof(teng2)/sizeof(char),
wexp2, sizeof(wexp2)/sizeof(PRUint32)) )
{
printf("Test 5 Passed\n\n");
} else {
ok = PR_FALSE;
printf("Test 5 Failed\n\n");
}
printf("Test 6 - {First,Next}ForwardBreak():\n");
if(TestASCIIWB(lb, teng3, sizeof(teng3)/sizeof(char),
wexp3, sizeof(wexp3)/sizeof(PRUint32)) )
{
printf("Test 6 Passed\n\n");
} else {
ok = PR_FALSE;
printf("Test 6 Failed\n\n");
}
NS_IF_RELEASE(lb);
}
NS_RELEASE(t);
}
printf("==================================\n");
printf("Finish nsIWordBreakerFactory Test \n");
printf("==================================\n");
return ok;
}
void SamplePrintWordWithBreak();
void SampleFindWordBreakFromPosition(PRUint32 fragN, PRUint32 offset);
// Sample Code
// 012345678901234
static const char wb0[] = "T";
static const char wb1[] = "h";
static const char wb2[] = "is is a int";
static const char wb3[] = "ernationali";
static const char wb4[] = "zation work.";
static const char* wb[] = {wb0,wb1,wb2,wb3,wb4};
void SampleWordBreakUsage()
{
SamplePrintWordWithBreak();
SampleFindWordBreakFromPosition(0,0); // This
SampleFindWordBreakFromPosition(1,0); // This
SampleFindWordBreakFromPosition(2,0); // This
SampleFindWordBreakFromPosition(2,1); // This
SampleFindWordBreakFromPosition(2,9); // [space]
SampleFindWordBreakFromPosition(2,10); // internationalization
SampleFindWordBreakFromPosition(3,4); // internationalization
SampleFindWordBreakFromPosition(3,8); // internationalization
SampleFindWordBreakFromPosition(4,6); // [space]
SampleFindWordBreakFromPosition(4,7); // work
}
void SamplePrintWordWithBreak()
{
PRUint32 numOfFragment = sizeof(wb) / sizeof(char*);
nsIWordBreakerFactory *t = NULL;
nsresult res = CallGetService(kLWBrkCID, &t);
nsIWordBreaker *wbk;
nsAutoString wb_arg;
res = t->GetBreaker(wb_arg, &wbk);
nsAutoString result;
nsAutoString tmp;
for(PRUint32 i = 0; i < numOfFragment; i++)
{
nsAutoString fragText; fragText.AssignWithConversion(wb[i]);
// nsBreakState bk(fragText.get(), fragText.Length());
PRUint32 cur = 0;
PRBool done;
res = wbk->NextWord(fragText.get(), fragText.Length(), cur, &cur, &done);
PRUint32 start = 0;
for(PRUint32 j = 0; ! done ; j++)
{
tmp.Truncate();
fragText.Mid(tmp, start, cur - start);
result.Append(tmp);
result.AppendLiteral("^");
start = cur;
wbk->NextWord(fragText.get(), fragText.Length(), cur, &cur, &done);
}
tmp.Truncate();
fragText.Mid(tmp, start, fragText.Length() - start);
result.Append(tmp);
if( i != (numOfFragment -1 ))
{
nsAutoString nextFragText; nextFragText.AssignWithConversion(wb[i+1]);
PRBool canBreak = PR_TRUE;
res = wbk->BreakInBetween( fragText.get(),
fragText.Length(),
nextFragText.get(),
nextFragText.Length(),
&canBreak
);
if(canBreak)
result.AppendLiteral("^");
fragText = nextFragText;
}
}
printf("Output From SamplePrintWordWithBreak() \n\n");
printf("[%s]\n", NS_LossyConvertUCS2toASCII(result).get());
}
void SampleFindWordBreakFromPosition(PRUint32 fragN, PRUint32 offset)
{
PRUint32 numOfFragment = sizeof(wb) / sizeof(char*);
nsIWordBreakerFactory *t = NULL;
nsresult res = CallGetService(kLWBrkCID, &t);
nsIWordBreaker *wbk;
nsAutoString wb_arg;
res = t->GetBreaker(wb_arg, &wbk);
nsAutoString fragText; fragText.AssignWithConversion(wb[fragN]);
PRUint32 begin, end;
nsAutoString result;
res = wbk->FindWord(fragText.get(), fragText.Length(),
offset, &begin, &end);
PRBool canbreak;
fragText.Mid(result, begin, end-begin);
if((PRUint32)fragText.Length() == end) // if we hit the end of the fragment
{
nsAutoString curFragText = fragText;
for(PRUint32 p = fragN +1; p < numOfFragment ;p++)
{
nsAutoString nextFragText; nextFragText.AssignWithConversion(wb[p]);
res = wbk->BreakInBetween(curFragText.get(),
curFragText.Length(),
nextFragText.get(),
nextFragText.Length(),
&canbreak);
if(canbreak)
break;
PRUint32 b, e;
res = wbk->FindWord(nextFragText.get(), nextFragText.Length(),
0, &b, &e);
nsAutoString tmp;
nextFragText.Mid(tmp,b,e-b);
result.Append(tmp);
if((PRUint32)nextFragText.Length() != e)
break;
nextFragText = curFragText;
}
}
if(0 == begin) // if we hit the beginning of the fragment
{
nsAutoString curFragText = fragText;
for(PRUint32 p = fragN ; p > 0 ;p--)
{
nsAutoString prevFragText; prevFragText.AssignWithConversion(wb[p-1]);
res = wbk->BreakInBetween(prevFragText.get(),
prevFragText.Length(),
curFragText.get(),
curFragText.Length(),
&canbreak);
if(canbreak)
break;
PRUint32 b, e;
res = wbk->FindWord(prevFragText.get(), prevFragText.Length(),
prevFragText.Length(), &b, &e);
nsAutoString tmp;
prevFragText.Mid(tmp,b,e-b);
result.Insert(tmp,0);
if(0 != b)
break;
prevFragText = curFragText;
}
}
printf("Output From SamplePrintWordWithBreak() \n\n");
printf("[%s]\n", NS_LossyConvertUCS2toASCII(result).get());
}
// Main
int main(int argc, char** argv) {
NS_InitXPCOM2(nsnull, nsnull, nsnull);
// --------------------------------------------
printf("Test Line Break\n");
PRBool lbok ;
PRBool wbok ;
lbok =TestWordBreaker();
if(lbok)
printf("Line Break Test\nOK\n");
else
printf("Line Break Test\nFailed\n");
wbok = TestLineBreaker();
if(wbok)
printf("Word Break Test\nOK\n");
else
printf("Word Break Test\nFailed\n");
SampleWordBreakUsage();
// --------------------------------------------
printf("Finish All The Test Cases\n");
if(lbok && wbok)
printf("Line/Word Break Test\nOK\n");
else
printf("Line/Word Break Test\nFailed\n");
return 0;
}