// src/third_party/icu/source/test/intltest/tstnrapi.cpp - cobalt - Git at Google

 /********************************************************************
  * COPYRIGHT:
  * Copyright (c) 1997-2010, International Business Machines Corporation and
  * others. All Rights Reserved.
  ********************************************************************/

 #include "unicode/utypes.h"
 #include "unicode/uchar.h"
 #include "unicode/normlzr.h"
 #include "unicode/uniset.h"
 #include "unicode/usetiter.h"
 #include "unicode/schriter.h"
 #include "tstnorm.h"

 #if !UCONFIG_NO_NORMALIZATION

 // File-scope error code that TestNormalizerAPI() hands to the static
 // Normalizer::normalize()/compose()/decompose()/concatenate() calls.
 static UErrorCode status = U_ZERO_ERROR;

 // test APIs that are not otherwise used - improve test coverage
 void
 BasicNormalizerTest::TestNormalizerAPI() {
     // instantiate a Normalizer from a CharacterIterator
     UnicodeString s=UnicodeString("a\\u0308\\uac00\\U0002f800", "").unescape();
     s.append(s); // make s a bit longer and more interesting
     StringCharacterIterator iter(s);
     Normalizer norm(iter, UNORM_NFC);
     if(norm.next()!=0xe4) {
         dataerrln("error in Normalizer(CharacterIterator).next()");
     }

     // test copy constructor
     Normalizer copy(norm);
     if(copy.next()!=0xac00) {
         dataerrln("error in Normalizer(Normalizer(CharacterIterator)).next()");
     }

     // test clone(), ==, and hashCode()
     Normalizer *clone=copy.clone();
     if(*clone!=copy) {
         errln("error in Normalizer(Normalizer(CharacterIterator)).clone()!=copy");
     }
     // clone must have the same hashCode()
     if(clone->hashCode()!=copy.hashCode()) {
         errln("error in Normalizer(Normalizer(CharacterIterator)).clone()->hashCode()!=copy.hashCode()");
     }
     if(clone->next()!=0x4e3d) {
         dataerrln("error in Normalizer(Normalizer(CharacterIterator)).clone()->next()");
     }
     // position changed, must change hashCode()
     if(clone->hashCode()==copy.hashCode()) {
         errln("error in Normalizer(Normalizer(CharacterIterator)).clone()->next().hashCode()==copy.hashCode()");
     }
     delete clone;
     clone=0;

     // test compose() and decompose()
     UnicodeString tel, nfkc, nfkd;
     tel=UnicodeString(1, (UChar32)0x2121, 10);
     tel.insert(1, (UChar)0x301);

     UErrorCode errorCode=U_ZERO_ERROR;
     Normalizer::compose(tel, TRUE, 0, nfkc, errorCode);
     Normalizer::decompose(tel, TRUE, 0, nfkd, errorCode);
     if(U_FAILURE(errorCode)) {
         dataerrln("error in Normalizer::(de)compose(): %s", u_errorName(errorCode));
     } else if(
         nfkc!=UnicodeString("TE\\u0139TELTELTELTELTELTELTELTELTEL", "").unescape() ||
         nfkd!=UnicodeString("TEL\\u0301TELTELTELTELTELTELTELTELTEL", "").unescape()
     ) {
         errln("error in Normalizer::(de)compose(): wrong result(s)");
     }

     // test setIndex()
     norm.setIndexOnly(3);
     if(norm.current()!=0x4e3d) {
         dataerrln("error in Normalizer(CharacterIterator).setIndex(3)");
     }

     // test setText(CharacterIterator) and getText()
     UnicodeString out, out2;
     errorCode=U_ZERO_ERROR;
     copy.setText(iter, errorCode);
     if(U_FAILURE(errorCode)) {
         errln("error Normalizer::setText() failed: %s", u_errorName(errorCode));
     } else {
         copy.getText(out);
         iter.getText(out2);
         if( out!=out2 ||
             copy.startIndex()!=iter.startIndex() ||
             copy.endIndex()!=iter.endIndex()
         ) {
             errln("error in Normalizer::setText() or Normalizer::getText()");
         }
     }

     // test setText(UChar *), getUMode() and setMode()
     errorCode=U_ZERO_ERROR;
     copy.setText(s.getBuffer()+1, s.length()-1, errorCode);
     copy.setMode(UNORM_NFD);
     if(copy.getUMode()!=UNORM_NFD) {
         errln("error in Normalizer::setMode() or Normalizer::getUMode()");
     }
     if(copy.next()!=0x308 || copy.next()!=0x1100) {
         dataerrln("error in Normalizer::setText(UChar *) or Normalizer::setMode()");
     }

     // test setText(UChar *, length=-1)
     errorCode=U_ZERO_ERROR;

     // NUL-terminate s
     s.append((UChar)0);         // append NUL
     s.truncate(s.length()-1);   // undo length change

     copy.setText(s.getBuffer()+1, -1, errorCode);
     if(copy.endIndex()!=s.length()-1) {
         errln("error in Normalizer::setText(UChar *, -1)");
     }

     // test setOption() and getOption()
     copy.setOption(0xaa0000, TRUE);
     copy.setOption(0x20000, FALSE);
     if(!copy.getOption(0x880000) || copy.getOption(0x20000)) {
         errln("error in Normalizer::setOption() or Normalizer::getOption()");
     }

     // test last()/previous() with an internal buffer overflow
     errorCode=U_ZERO_ERROR;
     copy.setText(UnicodeString(1000, (UChar32)0x308, 1000), errorCode);
     if(copy.last()!=0x308) {
         errln("error in Normalizer(1000*U+0308).last()");
     }

     // test UNORM_NONE
     norm.setMode(UNORM_NONE);
     if(norm.first()!=0x61 || norm.next()!=0x308 || norm.last()!=0x2f800) {
         errln("error in Normalizer(UNORM_NONE).first()/next()/last()");
     }
     Normalizer::normalize(s, UNORM_NONE, 0, out, status);
     if(out!=s) {
         errln("error in Normalizer::normalize(UNORM_NONE)");
     }

     // test that the same string can be used as source and destination
     s.setTo((UChar)0xe4);
     Normalizer::normalize(s, UNORM_NFD, 0, s, status);
     if(s.charAt(1)!=0x308) {
         dataerrln("error in Normalizer::normalize(UNORM_NFD, self)");
     }
     Normalizer::normalize(s, UNORM_NFC, 0, s, status);
     if(s.charAt(0)!=0xe4) {
         dataerrln("error in Normalizer::normalize(UNORM_NFC, self)");
     }
     Normalizer::decompose(s, FALSE, 0, s, status);
     if(s.charAt(1)!=0x308) {
         dataerrln("error in Normalizer::decompose(self)");
     }
     Normalizer::compose(s, FALSE, 0, s, status);
     if(s.charAt(0)!=0xe4) {
         dataerrln("error in Normalizer::compose(self)");
     }
     Normalizer::concatenate(s, s, s, UNORM_NFC, 0, status);
     if(s.charAt(1)!=0xe4) {
         dataerrln("error in Normalizer::decompose(self)");
     }
 }

 #endif
	/********************************************************************
	* COPYRIGHT:
	* Copyright (c) 1997-2010, International Business Machines Corporation and
	* others. All Rights Reserved.
	********************************************************************/

	#include "unicode/utypes.h"
	#include "unicode/uchar.h"
	#include "unicode/normlzr.h"
	#include "unicode/uniset.h"
	#include "unicode/usetiter.h"
	#include "unicode/schriter.h"
	#include "tstnorm.h"

	#if !UCONFIG_NO_NORMALIZATION

	// File-scope error code that TestNormalizerAPI() hands to the static
	// Normalizer::normalize()/compose()/decompose()/concatenate() calls.
	static UErrorCode status = U_ZERO_ERROR;

	// test APIs that are not otherwise used - improve test coverage
	void
	BasicNormalizerTest::TestNormalizerAPI() {
	// instantiate a Normalizer from a CharacterIterator
	UnicodeString s=UnicodeString("a\\u0308\\uac00\\U0002f800", "").unescape();
	s.append(s); // make s a bit longer and more interesting
	StringCharacterIterator iter(s);
	Normalizer norm(iter, UNORM_NFC);
	if(norm.next()!=0xe4) {
	dataerrln("error in Normalizer(CharacterIterator).next()");
	}

	// test copy constructor
	Normalizer copy(norm);
	if(copy.next()!=0xac00) {
	dataerrln("error in Normalizer(Normalizer(CharacterIterator)).next()");
	}

	// test clone(), ==, and hashCode()
	Normalizer *clone=copy.clone();
	if(*clone!=copy) {
	errln("error in Normalizer(Normalizer(CharacterIterator)).clone()!=copy");
	}
	// clone must have the same hashCode()
	if(clone->hashCode()!=copy.hashCode()) {
	errln("error in Normalizer(Normalizer(CharacterIterator)).clone()->hashCode()!=copy.hashCode()");
	}
	if(clone->next()!=0x4e3d) {
	dataerrln("error in Normalizer(Normalizer(CharacterIterator)).clone()->next()");
	}
	// position changed, must change hashCode()
	if(clone->hashCode()==copy.hashCode()) {
	errln("error in Normalizer(Normalizer(CharacterIterator)).clone()->next().hashCode()==copy.hashCode()");
	}
	delete clone;
	clone=0;

	// test compose() and decompose()
	UnicodeString tel, nfkc, nfkd;
	tel=UnicodeString(1, (UChar32)0x2121, 10);
	tel.insert(1, (UChar)0x301);

	UErrorCode errorCode=U_ZERO_ERROR;
	Normalizer::compose(tel, TRUE, 0, nfkc, errorCode);
	Normalizer::decompose(tel, TRUE, 0, nfkd, errorCode);
	if(U_FAILURE(errorCode)) {
	dataerrln("error in Normalizer::(de)compose(): %s", u_errorName(errorCode));
	} else if(
	nfkc!=UnicodeString("TE\\u0139TELTELTELTELTELTELTELTELTEL", "").unescape() \|\|
	nfkd!=UnicodeString("TEL\\u0301TELTELTELTELTELTELTELTELTEL", "").unescape()
	) {
	errln("error in Normalizer::(de)compose(): wrong result(s)");
	}

	// test setIndex()
	norm.setIndexOnly(3);
	if(norm.current()!=0x4e3d) {
	dataerrln("error in Normalizer(CharacterIterator).setIndex(3)");
	}

	// test setText(CharacterIterator) and getText()
	UnicodeString out, out2;
	errorCode=U_ZERO_ERROR;
	copy.setText(iter, errorCode);
	if(U_FAILURE(errorCode)) {
	errln("error Normalizer::setText() failed: %s", u_errorName(errorCode));
	} else {
	copy.getText(out);
	iter.getText(out2);
	if( out!=out2 \|\|
	copy.startIndex()!=iter.startIndex() \|\|
	copy.endIndex()!=iter.endIndex()
	) {
	errln("error in Normalizer::setText() or Normalizer::getText()");
	}
	}

	// test setText(UChar *), getUMode() and setMode()
	errorCode=U_ZERO_ERROR;
	copy.setText(s.getBuffer()+1, s.length()-1, errorCode);
	copy.setMode(UNORM_NFD);
	if(copy.getUMode()!=UNORM_NFD) {
	errln("error in Normalizer::setMode() or Normalizer::getUMode()");
	}
	if(copy.next()!=0x308 \|\| copy.next()!=0x1100) {
	dataerrln("error in Normalizer::setText(UChar *) or Normalizer::setMode()");
	}

	// test setText(UChar *, length=-1)
	errorCode=U_ZERO_ERROR;

	// NUL-terminate s
	s.append((UChar)0); // append NUL
	s.truncate(s.length()-1); // undo length change

	copy.setText(s.getBuffer()+1, -1, errorCode);
	if(copy.endIndex()!=s.length()-1) {
	errln("error in Normalizer::setText(UChar *, -1)");
	}

	// test setOption() and getOption()
	copy.setOption(0xaa0000, TRUE);
	copy.setOption(0x20000, FALSE);
	if(!copy.getOption(0x880000) \|\| copy.getOption(0x20000)) {
	errln("error in Normalizer::setOption() or Normalizer::getOption()");
	}

	// test last()/previous() with an internal buffer overflow
	errorCode=U_ZERO_ERROR;
	copy.setText(UnicodeString(1000, (UChar32)0x308, 1000), errorCode);
	if(copy.last()!=0x308) {
	errln("error in Normalizer(1000*U+0308).last()");
	}

	// test UNORM_NONE
	norm.setMode(UNORM_NONE);
	if(norm.first()!=0x61 \|\| norm.next()!=0x308 \|\| norm.last()!=0x2f800) {
	errln("error in Normalizer(UNORM_NONE).first()/next()/last()");
	}
	Normalizer::normalize(s, UNORM_NONE, 0, out, status);
	if(out!=s) {
	errln("error in Normalizer::normalize(UNORM_NONE)");
	}

	// test that the same string can be used as source and destination
	s.setTo((UChar)0xe4);
	Normalizer::normalize(s, UNORM_NFD, 0, s, status);
	if(s.charAt(1)!=0x308) {
	dataerrln("error in Normalizer::normalize(UNORM_NFD, self)");
	}
	Normalizer::normalize(s, UNORM_NFC, 0, s, status);
	if(s.charAt(0)!=0xe4) {
	dataerrln("error in Normalizer::normalize(UNORM_NFC, self)");
	}
	Normalizer::decompose(s, FALSE, 0, s, status);
	if(s.charAt(1)!=0x308) {
	dataerrln("error in Normalizer::decompose(self)");
	}
	Normalizer::compose(s, FALSE, 0, s, status);
	if(s.charAt(0)!=0xe4) {
	dataerrln("error in Normalizer::compose(self)");
	}
	Normalizer::concatenate(s, s, s, UNORM_NFC, 0, status);
	if(s.charAt(1)!=0xe4) {
	dataerrln("error in Normalizer::decompose(self)");
	}
	}

	#endif