node/deps/icu-small/source/i18n/collationsets.h

// © 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
*******************************************************************************
* Copyright (C) 2013-2014, International Business Machines
* Corporation and others.  All Rights Reserved.
*******************************************************************************
* collationsets.h
*
* created on: 2013feb09
* created by: Markus W. Scherer
*/

#ifndef __COLLATIONSETS_H__
#define __COLLATIONSETS_H__

#include "unicode/utypes.h"

#if !UCONFIG_NO_COLLATION

#include "unicode/uniset.h"
#include "collation.h"

U_NAMESPACE_BEGIN

struct CollationData;

/**
 * Finds the set of characters and strings that sort differently in the tailoring
 * from the base data.
 *
 * Every mapping in the tailoring needs to be compared to the base,
 * because some mappings are copied for optimization, and
 * all contractions for a character are copied if any contractions for that character
 * are added, modified or removed.
 *
 * It might be simpler to re-parse the rule string, but:
 * - That would require duplicating some of the from-rules builder code.
 * - That would make the runtime code depend on the builder.
 * - That would only work if we have the rule string, and we allow users to
 *   omit the rule string from data files.
 */
class TailoredSet : public UMemory {
public:
    /**
     * Remembers the caller's set pointer; it is only stored here, not dereferenced.
     * Both CollationData pointers and the suffix pointer start out NULL, and the
     * internal error code starts as U_ZERO_ERROR.
     *
     * @param t set pointer kept in the `tailored` member
     */
    TailoredSet(UnicodeSet *t)
            : data(NULL),
              baseData(NULL),
              tailored(t),
              suffix(NULL),
              errorCode(U_ZERO_ERROR) {}

    /**
     * Runs the comparison for one CollationData (defined out of line).
     *
     * @param d         the collation data to examine
     * @param errorCode caller's ICU error code
     *                  (NOTE(review): presumably the usual in/out UErrorCode
     *                  convention -- confirm in collationsets.cpp)
     */
    void forData(const CollationData *d, UErrorCode &errorCode);

    /**
     * Handles one range [start, end] of code points together with its ce32 value.
     *
     * @return U_SUCCESS(errorCode) in C++, void in Java
     * @internal only public for access by callback
     */
    UBool handleCE32(UChar32 start, UChar32 end, uint32_t ce32);

private:
    // Comparison helpers, all defined out of line.
    // compare() takes a code point together with two ce32 values (ce32 / baseCE32).
    void compare(UChar32 c, uint32_t ce32, uint32_t baseCE32);
    // NOTE(review): p and q presumably point at the two prefix/contraction
    // structures being compared -- confirm in collationsets.cpp.
    void comparePrefixes(UChar32 c, const UChar *p, const UChar *q);
    void compareContractions(UChar32 c, const UChar *p, const UChar *q);

    // "add" helpers, all defined out of line.
    // NOTE(review): presumably these insert into *tailored -- confirm in collationsets.cpp.
    void addPrefixes(const CollationData *d, UChar32 c, const UChar *p);
    void addPrefix(const CollationData *d, const UnicodeString &pfx, UChar32 c, uint32_t ce32);
    void addContractions(UChar32 c, const UChar *p);
    void addSuffix(UChar32 c, const UnicodeString &sfx);
    void add(UChar32 c);

    /**
     * Prefixes are reversed in the data structure.
     * Stores a copy of pfx in unreversedPrefix and reverses that copy in place;
     * pfx itself is not modified.
     */
    void setPrefix(const UnicodeString &pfx) {
        (unreversedPrefix = pfx).reverse();
    }

    /** Clears the stored prefix via UnicodeString::remove(). */
    void resetPrefix() {
        unreversedPrefix.remove();
    }

    const CollationData *data;       // NULL after construction
    const CollationData *baseData;   // NULL after construction
    UnicodeSet *tailored;            // the pointer handed to the constructor
    UnicodeString unreversedPrefix;  // maintained by setPrefix() / resetPrefix()
    const UnicodeString *suffix;     // NULL after construction
    UErrorCode errorCode;            // U_ZERO_ERROR after construction
};

/**
 * Walks collation data and works with a set of contractions, a set of expansions
 * and a CE sink, all supplied by the caller as pointers.
 *
 * NOTE(review): judging by the names, this presumably fills *contractions and
 * *expansions and reports CEs to *sink -- confirm in collationsets.cpp.
 */
class ContractionsAndExpansions : public UMemory {
public:
    /**
     * Callback interface with two pure-virtual handlers: one taking a single
     * 64-bit CE, one taking an array of CEs plus its length.
     */
    class CESink : public UMemory {
    public:
        virtual ~CESink();
        /** @param ce a single 64-bit CE value */
        virtual void handleCE(int64_t ce) = 0;
        /**
         * @param ces    array of 64-bit CE values
         * @param length NOTE(review): presumably the number of entries in ces -- confirm
         */
        virtual void handleExpansion(const int64_t ces[], int32_t length) = 0;
    };

    /**
     * Stores the caller's pointers and the prefixes flag; nothing is dereferenced here.
     * data and suffix start out NULL, checkTailored starts at 0 and the internal
     * error code starts as U_ZERO_ERROR. The ces array is not initialized here.
     *
     * @param con      pointer kept in `contractions`
     * @param exp      pointer kept in `expansions`
     * @param s        pointer kept in `sink`
     * @param prefixes value kept in `addPrefixes`
     */
    ContractionsAndExpansions(UnicodeSet *con, UnicodeSet *exp, CESink *s, UBool prefixes)
            : data(NULL),
              contractions(con),
              expansions(exp),
              sink(s),
              addPrefixes(prefixes),
              checkTailored(0),
              suffix(NULL),
              errorCode(U_ZERO_ERROR) {}

    // Entry points, defined out of line: one for a whole CollationData,
    // one for a single code point c.
    void forData(const CollationData *d, UErrorCode &errorCode);
    void forCodePoint(const CollationData *d, UChar32 c, UErrorCode &ec);

    // all following: @internal, only public for access by callback

    // Range handlers: each receives a code point range [start, end] and its ce32.
    void handleCE32(UChar32 start, UChar32 end, uint32_t ce32);

    void handlePrefixes(UChar32 start, UChar32 end, uint32_t ce32);
    void handleContractions(UChar32 start, UChar32 end, uint32_t ce32);

    // Range "add" helpers; addStrings() additionally names the target set.
    void addExpansions(UChar32 start, UChar32 end);
    void addStrings(UChar32 start, UChar32 end, UnicodeSet *set);

    /**
     * Prefixes are reversed in the data structure.
     * Stores a copy of pfx in unreversedPrefix and reverses that copy in place;
     * pfx itself is not modified.
     */
    void setPrefix(const UnicodeString &pfx) {
        (unreversedPrefix = pfx).reverse();
    }

    /** Clears the stored prefix via UnicodeString::remove(). */
    void resetPrefix() {
        unreversedPrefix.remove();
    }

    const CollationData *data;       // NULL after construction
    UnicodeSet *contractions;        // constructor argument `con`
    UnicodeSet *expansions;          // constructor argument `exp`
    CESink *sink;                    // constructor argument `s`
    UBool addPrefixes;               // constructor argument `prefixes`
    int8_t checkTailored;            // -1: collected tailored  +1: exclude tailored (0 after construction)
    UnicodeSet tailored;
    UnicodeSet ranges;
    UnicodeString unreversedPrefix;  // maintained by setPrefix() / resetPrefix()
    const UnicodeString *suffix;     // NULL after construction
    int64_t ces[Collation::MAX_EXPANSION_LENGTH];  // CE buffer sized to the maximum expansion length
    UErrorCode errorCode;            // U_ZERO_ERROR after construction
};

U_NAMESPACE_END

#endif  // !UCONFIG_NO_COLLATION
#endif  // __COLLATIONSETS_H__
deps: ICU 59.1 bump * No feature changes. * Bug fixes. * Details: http://site.icu-project.org/download/59 Fixes: https://github.com/nodejs/node/issues/12077 PR-URL: https://github.com/nodejs/node/pull/12486 Refs: https://github.com/nodejs/node/issues/7844 Reviewed-By: James M Snell <jasnell@gmail.com> Reviewed-By: Michael Dawson <michael_dawson@ca.ibm.com> Reviewed-By: Refael Ackermann <refack@gmail.com> 8 years ago			`// © 2016 and later: Unicode, Inc. and others.`
deps: Intl: ICU 58 bump - small icu (BIG COMMIT) This commit contains the ICU 58.1 delta. It is especially large because of the ICU license change, and, because the line endings were off previously. * bump to ICU 58.1 - check in small ICU source * from 58.1 final http://site.icu-project.org/download/58 Fixes: https://github.com/nodejs/node/issues/7844 PR-URL: https://github.com/nodejs/node/pull/9234 Reviewed-By: James M Snell <jasnell@gmail.com> 8 years ago			`// License & terms of use: http://www.unicode.org/copyright.html`
deps: Intl: Check in "small-icu" 57.1 * this commit has "small" ICU 57.1. See other related commit for tools to generate this commit. Fixes: https://github.com/nodejs/node/issues/3476 PR-URL: https://github.com/nodejs/node/pull/6088 Reviewed-By: James M Snell <jasnell@gmail.com> 9 years ago			`/*`
			`*******************************************************************************`
			`* Copyright (C) 2013-2014, International Business Machines`
			`* Corporation and others. All Rights Reserved.`
			`*******************************************************************************`
			`* collationsets.h`
			`*`
			`* created on: 2013feb09`
			`* created by: Markus W. Scherer`
			`*/`

			`#ifndef __COLLATIONSETS_H__`
			`#define __COLLATIONSETS_H__`

			`#include "unicode/utypes.h"`

			`#if !UCONFIG_NO_COLLATION`

			`#include "unicode/uniset.h"`
			`#include "collation.h"`

			`U_NAMESPACE_BEGIN`

			`struct CollationData;`

			`/**`
			`* Finds the set of characters and strings that sort differently in the tailoring`
			`* from the base data.`
			`*`
			`* Every mapping in the tailoring needs to be compared to the base,`
			`* because some mappings are copied for optimization, and`
			`* all contractions for a character are copied if any contractions for that character`
			`* are added, modified or removed.`
			`*`
			`* It might be simpler to re-parse the rule string, but:`
			`* - That would require duplicating some of the from-rules builder code.`
			`* - That would make the runtime code depend on the builder.`
			`* - That would only work if we have the rule string, and we allow users to`
			`* omit the rule string from data files.`
			`*/`
			`class TailoredSet : public UMemory {`
			`public:`
			`TailoredSet(UnicodeSet *t)`
			`: data(NULL), baseData(NULL),`
			`tailored(t),`
			`suffix(NULL),`
			`errorCode(U_ZERO_ERROR) {}`

			`void forData(const CollationData *d, UErrorCode &errorCode);`

			`/**`
			`* @return U_SUCCESS(errorCode) in C++, void in Java`
			`* @internal only public for access by callback`
			`*/`
			`UBool handleCE32(UChar32 start, UChar32 end, uint32_t ce32);`

			`private:`
			`void compare(UChar32 c, uint32_t ce32, uint32_t baseCE32);`
			`void comparePrefixes(UChar32 c, const UChar p, const UChar q);`
			`void compareContractions(UChar32 c, const UChar p, const UChar q);`

			`void addPrefixes(const CollationData d, UChar32 c, const UChar p);`
			`void addPrefix(const CollationData *d, const UnicodeString &pfx, UChar32 c, uint32_t ce32);`
			`void addContractions(UChar32 c, const UChar *p);`
			`void addSuffix(UChar32 c, const UnicodeString &sfx);`
			`void add(UChar32 c);`

			`/** Prefixes are reversed in the data structure. */`
			`void setPrefix(const UnicodeString &pfx) {`
			`unreversedPrefix = pfx;`
			`unreversedPrefix.reverse();`
			`}`
			`void resetPrefix() {`
			`unreversedPrefix.remove();`
			`}`

			`const CollationData *data;`
			`const CollationData *baseData;`
			`UnicodeSet *tailored;`
			`UnicodeString unreversedPrefix;`
			`const UnicodeString *suffix;`
			`UErrorCode errorCode;`
			`};`

			`class ContractionsAndExpansions : public UMemory {`
			`public:`
			`class CESink : public UMemory {`
			`public:`
			`virtual ~CESink();`
			`virtual void handleCE(int64_t ce) = 0;`
			`virtual void handleExpansion(const int64_t ces[], int32_t length) = 0;`
			`};`

			`ContractionsAndExpansions(UnicodeSet con, UnicodeSet exp, CESink *s, UBool prefixes)`
			`: data(NULL),`
			`contractions(con), expansions(exp),`
			`sink(s),`
			`addPrefixes(prefixes),`
			`checkTailored(0),`
			`suffix(NULL),`
			`errorCode(U_ZERO_ERROR) {}`

			`void forData(const CollationData *d, UErrorCode &errorCode);`
			`void forCodePoint(const CollationData *d, UChar32 c, UErrorCode &ec);`

			`// all following: @internal, only public for access by callback`

			`void handleCE32(UChar32 start, UChar32 end, uint32_t ce32);`

			`void handlePrefixes(UChar32 start, UChar32 end, uint32_t ce32);`
			`void handleContractions(UChar32 start, UChar32 end, uint32_t ce32);`

			`void addExpansions(UChar32 start, UChar32 end);`
			`void addStrings(UChar32 start, UChar32 end, UnicodeSet *set);`

			`/** Prefixes are reversed in the data structure. */`
			`void setPrefix(const UnicodeString &pfx) {`
			`unreversedPrefix = pfx;`
			`unreversedPrefix.reverse();`
			`}`
			`void resetPrefix() {`
			`unreversedPrefix.remove();`
			`}`

			`const CollationData *data;`
			`UnicodeSet *contractions;`
			`UnicodeSet *expansions;`
			`CESink *sink;`
			`UBool addPrefixes;`
			`int8_t checkTailored; // -1: collected tailored +1: exclude tailored`
			`UnicodeSet tailored;`
			`UnicodeSet ranges;`
			`UnicodeString unreversedPrefix;`
			`const UnicodeString *suffix;`
			`int64_t ces[Collation::MAX_EXPANSION_LENGTH];`
			`UErrorCode errorCode;`
			`};`

			`U_NAMESPACE_END`

			`#endif // !UCONFIG_NO_COLLATION`
			`#endif // __COLLATIONSETS_H__`