icu/icu4c/source/i18n/messageformat2_checker.h
Tim Chevalier 62b95bb5f9 ICU-22908 MF2: Update spec tests and update implementation for recent spec changes
Updating the spec tests requires two implementation changes:
* Match on variables rather than expressions --
  see https://github.com/unicode-org/message-format-wg/pull/877
* Require attribute values to be literals (if present) --
  see https://github.com/unicode-org/message-format-wg/pull/894

This updates the spec tests to commit 6c3704f41a9c24427126429fb43992b03609dfc8
in https://github.com/unicode-org/message-format-wg/ . Any changes
following that commit will be addressed in a future PR.
2024-12-09 09:38:28 -08:00

109 lines
3.5 KiB
C++

// © 2024 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
#include "unicode/utypes.h"
#ifndef U_HIDE_DEPRECATED_API
#ifndef MESSAGEFORMAT_CHECKER_H
#define MESSAGEFORMAT_CHECKER_H
#if U_SHOW_CPLUSPLUS_API
#if !UCONFIG_NO_NORMALIZATION
#if !UCONFIG_NO_FORMATTING
#if !UCONFIG_NO_MF2
#include "unicode/messageformat2_data_model.h"
#include "messageformat2_errors.h"
U_NAMESPACE_BEGIN
namespace message2 {
using namespace data_model;
// Used for checking missing selector annotation errors
// and duplicate declaration errors (specifically for
// implicit declarations)
class TypeEnvironment : public UMemory {
public:
// MessageFormat has a simple type system;
// variables are in-scope and annotated; in-scope and unannotated;
// or free (a free variable has no explicit declaration in the scope
// of its use.)
enum Type {
Annotated,
Unannotated,
FreeVariable
};
void extend(const VariableName&, Type, UErrorCode& status);
Type get(const VariableName&) const;
bool known(const VariableName&) const;
TypeEnvironment(UErrorCode& status);
virtual ~TypeEnvironment();
private:
// Stores variables known to be annotated.
LocalPointer<UVector> annotated; // Vector of `VariableName`s
// Stores variables that are in-scope but unannotated.
LocalPointer<UVector> unannotated; // Vector of `VariableName`s
// Stores free variables that are used in the RHS of a declaration
LocalPointer<UVector> freeVars; // Vector of `VariableNames`; tracks free variables
// This can't just be "variables that don't appear in
// `annotated` or `unannotated`", as a use introduces
// an explicit declaration
}; // class TypeEnvironment
class MessageFormatter;
// Checks a data model for semantic errors
// (Errors are defined in https://github.com/unicode-org/message-format-wg/blob/main/spec/formatting.md )
class Checker {
public:
void check(UErrorCode&);
Checker(const MFDataModel& d, StaticErrors& e, const MessageFormatter& mf)
: dataModel(d), errors(e), context(mf) {}
private:
Key normalizeNFC(const Key&) const;
void requireAnnotated(const TypeEnvironment&, const VariableName&, UErrorCode&);
void addFreeVars(TypeEnvironment& t, const Operand&, UErrorCode&);
void addFreeVars(TypeEnvironment& t, const Operator&, UErrorCode&);
void addFreeVars(TypeEnvironment& t, const OptionMap&, UErrorCode&);
void addFreeVars(TypeEnvironment& t, const Expression&, UErrorCode&);
void checkDeclarations(TypeEnvironment&, UErrorCode&);
void checkSelectors(const TypeEnvironment&, UErrorCode&);
void checkVariants(UErrorCode&);
void check(const OptionMap&);
void check(const Operand&);
void check(const Expression&);
void check(const Pattern&);
const MFDataModel& dataModel;
StaticErrors& errors;
// Used for NFC normalization
const MessageFormatter& context;
}; // class Checker
} // namespace message2
U_NAMESPACE_END
#endif /* #if !UCONFIG_NO_MF2 */
#endif /* #if !UCONFIG_NO_FORMATTING */
#endif /* #if !UCONFIG_NO_NORMALIZATION */
#endif /* U_SHOW_CPLUSPLUS_API */
#endif // MESSAGEFORMAT_CHECKER_H
#endif // U_HIDE_DEPRECATED_API
// eof