blob: 21c1af5a57cbfb6f9a6f7cf72e8cb825551bcd60 [file] [log] [blame]
/*
***************************************************************************
* Copyright (C) 2008-2015, International Business Machines Corporation
* and others. All Rights Reserved.
***************************************************************************
* file name: uspoof_build.cpp
* encoding: US-ASCII
* tab size: 8 (not used)
* indentation:4
*
* created on: 2008 Dec 8
* created by: Andy Heninger
*
* Unicode Spoof Detection Data Builder
* Builder-related functions are kept in separate files so that applications not needing
* the builder can more easily exclude them, typically by means of static linking.
*
* There are three relatively independent sets of Spoof data,
* Confusables,
* Whole Script Confusables
* ID character extensions.
*
* The data tables for each are built separately, each from its own definitions
*/
#include "starboard/client_porting/poem/string_poem.h"
#include "unicode/utypes.h"
#include "unicode/uspoof.h"
#include "unicode/unorm.h"
#include "unicode/uregex.h"
#include "unicode/ustring.h"
#include "cmemory.h"
#include "uspoof_impl.h"
#include "uhash.h"
#include "uvector.h"
#include "uassert.h"
#include "uarrsort.h"
#include "uspoof_conf.h"
#include "uspoof_wsconf.h"
#if !UCONFIG_NO_NORMALIZATION
U_NAMESPACE_USE
// Defined in uspoof.cpp, initializes file-static variables.
U_CFUNC void uspoof_internalInitStatics(UErrorCode *status);
// The main data building function
U_CAPI USpoofChecker * U_EXPORT2
uspoof_openFromSource(const char *confusables, int32_t confusablesLen,
const char *confusablesWholeScript, int32_t confusablesWholeScriptLen,
int32_t *errorType, UParseError *pe, UErrorCode *status) {
uspoof_internalInitStatics(status);
if (U_FAILURE(*status)) {
return NULL;
}
#if UCONFIG_NO_REGULAR_EXPRESSIONS
*status = U_UNSUPPORTED_ERROR;
return NULL;
#else
if (errorType!=NULL) {
*errorType = 0;
}
if (pe != NULL) {
pe->line = 0;
pe->offset = 0;
pe->preContext[0] = 0;
pe->postContext[0] = 0;
}
// Set up a shell of a spoof detector, with empty data.
SpoofData *newSpoofData = new SpoofData(*status);
SpoofImpl *This = new SpoofImpl(newSpoofData, *status);
// Compile the binary data from the source (text) format.
ConfusabledataBuilder::buildConfusableData(This, confusables, confusablesLen, errorType, pe, *status);
buildWSConfusableData(This, confusablesWholeScript, confusablesWholeScriptLen, pe, *status);
if (U_FAILURE(*status)) {
delete This;
This = NULL;
}
return (USpoofChecker *)This;
#endif // UCONFIG_NO_REGULAR_EXPRESSIONS
}
#endif