diff --git a/.gitignore b/.gitignore
index 60e7ec63e..c6d5a34bd 100644
--- a/.gitignore
+++ b/.gitignore
@@ -43,6 +43,7 @@ perf-*.xml
 test-*.xml
 
 # Directories
+.idea/
 .settings/
 .vs/
 .vscode/
diff --git a/docs/ucdxml.md b/docs/ucdxml.md
new file mode 100644
index 000000000..6711254f4
--- /dev/null
+++ b/docs/ucdxml.md
@@ -0,0 +1,69 @@
+# UCDXML
+
+There are three separate processes for generating and validating UCDXML files and their corresponding UAX42 report.
+
+1. Generate the UCDXML files.
+2. (Optional) You can compare the generated UCDXML files against each other (e.g., Flat vs Grouped) or against 
+   previous versions.
+3. Generate UAX42. There are three steps involved:
+
+   1. Generate the property value fragments. The updated versions should live in 
+      unicodetools/src/main/resources/org/unicode/uax42/fragments
+   2. Generate the index.html and index.rnc files for UAX42.
+   3. (Optional) Validate the UCDXML files using index.rnc.
+
+## Generate UCDXML files
+
+- You can generate flat or grouped versions of UCDXML.
+- You can generate UCDXML files for:
+  - the full range of code points
+  - the Unihan code points
+  - code points that are not Unihan code points
+
+```
+mvn compile exec:java '-Dexec.mainClass="org.unicode.xml.UCDXML"' '-Dexec.args="--range ALL --output FLAT"' -DCLDR_DIR=$(cd ../cldr; pwd) -DUNICODETOOLS_GEN_DIR=$(cd ../Generated; pwd) -DUNICODETOOLS_REPO_DIR=$(pwd)
+mvn compile exec:java '-Dexec.mainClass="org.unicode.xml.UCDXML"' '-Dexec.args="--range UNIHAN --output FLAT"' -DCLDR_DIR=$(cd ../cldr; pwd) -DUNICODETOOLS_GEN_DIR=$(cd ../Generated; pwd) -DUNICODETOOLS_REPO_DIR=$(pwd)
+mvn compile exec:java '-Dexec.mainClass="org.unicode.xml.UCDXML"' '-Dexec.args="--range NOUNIHAN --output FLAT"' -DCLDR_DIR=$(cd ../cldr; pwd) -DUNICODETOOLS_GEN_DIR=$(cd ../Generated; pwd) -DUNICODETOOLS_REPO_DIR=$(pwd)
+mvn compile exec:java '-Dexec.mainClass="org.unicode.xml.UCDXML"' '-Dexec.args="--range ALL --output GROUPED"' -DCLDR_DIR=$(cd ../cldr; pwd) -DUNICODETOOLS_GEN_DIR=$(cd ../Generated; pwd) -DUNICODETOOLS_REPO_DIR=$(pwd)
+mvn compile exec:java '-Dexec.mainClass="org.unicode.xml.UCDXML"' '-Dexec.args="--range UNIHAN --output GROUPED"' -DCLDR_DIR=$(cd ../cldr; pwd) -DUNICODETOOLS_GEN_DIR=$(cd ../Generated; pwd) -DUNICODETOOLS_REPO_DIR=$(pwd)
+mvn compile exec:java '-Dexec.mainClass="org.unicode.xml.UCDXML"' '-Dexec.args="--range NOUNIHAN --output GROUPED"' -DCLDR_DIR=$(cd ../cldr; pwd) -DUNICODETOOLS_GEN_DIR=$(cd ../Generated; pwd) -DUNICODETOOLS_REPO_DIR=$(pwd)
+```
+
+## Compare UCDXML files
+
+After generating UCDXML files, you can compare:
+
+- Different versions of the same type (range and output) of UCDXML file
+- Grouped and flat versions of the same code point range
+
+```
+mvn compile exec:java '-Dexec.mainClass="org.unicode.xml.CompareUCDXML"' '-Dexec.args="-a {path to file} -b {path to file}"'
+```
+
+## Generate UAX42
+
+### Step 1 - Generate property value fragments
+
+```
+mvn compile exec:java '-Dexec.mainClass="org.unicode.xml.GeneratePropertyValues"' -DCLDR_DIR=$(cd ../cldr ; pwd) -DUNICODETOOLS_GEN_DIR=$(cd ../Generated ; pwd) -DUNICODETOOLS_REPO_DIR=$(pwd)
+```
+
+UAX42 fragments live in unicodetools/src/main/resources/org/unicode/uax42/fragments
+
+### Step 2 - Generate UAX42 index.html and index.rnc
+
+```
+mvn xml:transform -f $(cd ./unicodetools/src/main/resources/org/unicode/uax42; pwd) -Doutputdir=$(cd ../Generated/uax42; pwd)
+```
+
+### Step 3 - Validate generated UCDXML files
+
+You'll need a [RELAX NG](https://relaxng.org/) schema validator.
+We'll use [jing-trang](https://github.com/relaxng/jing-trang) in this example.
+
+1. Clone and build [jing-trang](https://github.com/relaxng/jing-trang)
+2. Run the following:
+   ```
+   java -jar C:\_git\jing-trang\build\jing.jar -c UNICODETOOLS_REPO_DIR\uax\uax42\output\index.rnc <path to UCDXML file>
+   ```
+   Note that the UCDXML file has to be saved in NFD, because the Unihan syntax regular expressions expect NFD.
diff --git a/unicodetools/src/main/java/org/unicode/props/UcdProperty.java b/unicodetools/src/main/java/org/unicode/props/UcdProperty.java
index 914168c90..ec3d513a3 100644
--- a/unicodetools/src/main/java/org/unicode/props/UcdProperty.java
+++ b/unicodetools/src/main/java/org/unicode/props/UcdProperty.java
@@ -85,12 +85,16 @@ public enum UcdProperty {
     Emoji_SB(PropertyType.Miscellaneous, "ESB"),
     ISO_Comment(PropertyType.Miscellaneous, "isc"),
     Jamo_Short_Name(PropertyType.Miscellaneous, "JSN"),
+    NC_Corrected(PropertyType.Miscellaneous, "ncCorrected"),
+    NC_Original(PropertyType.Miscellaneous, "ncOriginal"),
+    NC_Version(PropertyType.Miscellaneous, "ncVersion"),
     Name(PropertyType.Miscellaneous, "na"),
     Name_Alias(PropertyType.Miscellaneous, null, ValueCardinality.Unordered, "Name_Alias"),
     Named_Sequences(PropertyType.Miscellaneous, "NS"),
     Named_Sequences_Prov(PropertyType.Miscellaneous, "NSP"),
     Standardized_Variant(PropertyType.Miscellaneous, null, ValueCardinality.Unordered, "SV"),
     Unicode_1_Name(PropertyType.Miscellaneous, "na1"),
+    emoji_variation_sequence(PropertyType.Miscellaneous, "EVS"),
     kAlternateHanYu(PropertyType.Miscellaneous, "cjkAlternateHanYu"),
     kAlternateJEF(PropertyType.Miscellaneous, "cjkAlternateJEF"),
     kAlternateKangXi(PropertyType.Miscellaneous, "cjkAlternateKangXi"),
diff --git a/unicodetools/src/main/java/org/unicode/props/UcdPropertyValues.java b/unicodetools/src/main/java/org/unicode/props/UcdPropertyValues.java
index f8bb22f1a..0aac98c26 100644
--- a/unicodetools/src/main/java/org/unicode/props/UcdPropertyValues.java
+++ b/unicodetools/src/main/java/org/unicode/props/UcdPropertyValues.java
@@ -766,6 +766,7 @@ public static East_Asian_Width_Values forName(String name) {
     // Emoji_DCM
     // Emoji_KDDI
     // Emoji_SB
+    // emoji_variation_sequence
     // Equivalent_Unified_Ideograph
     // FC_NFKC_Closure
     public enum General_Category_Values implements Named {
@@ -1668,6 +1669,9 @@ public static Line_Break_Values forName(String name) {
     // Name_Alias
     // Named_Sequences
     // Named_Sequences_Prov
+    // NC_Corrected
+    // NC_Original
+    // NC_Version
     public enum NFC_Quick_Check_Values implements Named {
         Maybe("M"),
         No("N"),
diff --git a/unicodetools/src/main/java/org/unicode/tools/emoji/LoadImage.java b/unicodetools/src/main/java/org/unicode/tools/emoji/LoadImage.java
index 7f9f3008b..c7912b690 100644
--- a/unicodetools/src/main/java/org/unicode/tools/emoji/LoadImage.java
+++ b/unicodetools/src/main/java/org/unicode/tools/emoji/LoadImage.java
@@ -891,7 +891,8 @@ public static void doSb(String outputDir) throws IOException {
         //                try {
         //                    copy(new URL(url), new File(outputDir + "/sb","sb_" + code + ".gif"));
         ////                    BufferedImage sourceImage = ImageIO.read(new URL(url));
-        ////                    writeImage(sourceImage,outputDir + "/sb","sb_" + code, "gif");
+        ////                    writeImage(sourceImage,outputDir + "/sb","sb_" + code,
+        // "gif");
         //                    System.out.println(code);
         //                } catch (Exception e) {
         //                    System.out.println("Skipping " + code);
diff --git a/unicodetools/src/main/java/org/unicode/xml/AttributeResolver.java b/unicodetools/src/main/java/org/unicode/xml/AttributeResolver.java
new file mode 100644
index 000000000..2d268878e
--- /dev/null
+++ b/unicodetools/src/main/java/org/unicode/xml/AttributeResolver.java
@@ -0,0 +1,351 @@
+package org.unicode.xml;
+
+import com.ibm.icu.impl.UnicodeMap;
+import com.ibm.icu.util.VersionInfo;
+import java.util.HashMap;
+import java.util.LinkedHashMap;
+import java.util.LinkedList;
+import java.util.List;
+import java.util.Locale;
+import java.util.Optional;
+import org.unicode.cldr.draft.FileUtilities;
+import org.unicode.props.IndexUnicodeProperties;
+import org.unicode.props.PropertyParsingInfo;
+import org.unicode.props.UcdLineParser;
+import org.unicode.props.UcdProperty;
+import org.unicode.props.UcdPropertyValues;
+import org.unicode.props.UnicodeProperty;
+
+/**
+ * Used by UCDXML to get string values of attributes for each code point from
+ * IndexUnicodeProperties.
+ */
+public class AttributeResolver {
+
+    private final IndexUnicodeProperties indexUnicodeProperties;
+    private final UnicodeMap<UcdPropertyValues.Age_Values> map_age;
+    private final UnicodeMap<UcdPropertyValues.Block_Values> map_block;
+    private final UnicodeMap<UcdPropertyValues.Decomposition_Type_Values> map_decomposition_type;
+    private final UnicodeMap<UcdPropertyValues.General_Category_Values> map_general_category;
+    private final UnicodeMap<UcdPropertyValues.Script_Values> map_script;
+    private final UnicodeMap<String> map_script_extensions;
+    private final HashMap<Integer, LinkedList<NameAlias>> map_NameAlias;
+
+    // If there is a change in any of these properties between two adjacent characters, it will
+    // result in a new range.
+    private final UCDPropertyDetail[] rangeDefiningPropertyDetails = {
+        UCDPropertyDetail.Age_Detail,
+        UCDPropertyDetail.Bidi_Class_Detail,
+        UCDPropertyDetail.Block_Detail,
+        UCDPropertyDetail.Decomposition_Mapping_Detail,
+        UCDPropertyDetail.Numeric_Type_Detail,
+        UCDPropertyDetail.Numeric_Value_Detail,
+        UCDPropertyDetail.Vertical_Orientation_Detail
+    };
+
+    public AttributeResolver(IndexUnicodeProperties iup) {
+        indexUnicodeProperties = iup;
+        map_age = indexUnicodeProperties.loadEnum(UcdProperty.Age);
+        map_block = indexUnicodeProperties.loadEnum(UcdProperty.Block);
+        map_decomposition_type = indexUnicodeProperties.loadEnum(UcdProperty.Decomposition_Type);
+        map_general_category = indexUnicodeProperties.loadEnum(UcdProperty.General_Category);
+        map_script = indexUnicodeProperties.loadEnum(UcdProperty.Script);
+        map_script_extensions =
+                indexUnicodeProperties.getProperty(UcdProperty.Script_Extensions).getUnicodeMap();
+
+        // UCD code is only set up to read a single Alias value from NameAliases.txt
+        // Instead, we'll load the Alias and the Type data as part of the constructor. We'll keep in
+        // memory as it
+        // NameAliases isn't too large.
+        map_NameAlias = loadNameAliases();
+    }
+
+    /** Name alias types; toString() yields the lower-case label passed to each constant. */
+    protected enum AliasType {
+        ABBREVIATION("abbreviation"),
+        ALTERNATE("alternate"),
+        CONTROL("control"),
+        CORRECTION("correction"),
+        FIGMENT("figment"),
+        NONE("none");
+
+        private final String label;
+
+        AliasType(String label) {
+            this.label = label;
+        }
+
+        @Override
+        public String toString() {
+            return label;
+        }
+    }
+
+    /** Immutable pairing of one alias string with its AliasType. */
+    private static class NameAlias {
+
+        // Both fields are assigned exactly once, in the constructor.
+        private final String alias;
+        private final AliasType type;
+
+        private NameAlias(String alias, AliasType type) {
+            this.alias = alias;
+            this.type = type;
+        }
+
+        /** Returns the alias text. */
+        public String getAlias() {
+            return alias;
+        }
+
+        /** Returns the type recorded for this alias. */
+        public AliasType getType() {
+            return type;
+        }
+    }
+
+    /** Orders NameAlias entries by their alias text, using String.compareTo. */
+    private static class NameAliasComparator implements java.util.Comparator<NameAlias> {
+
+        @Override
+        public int compare(NameAlias left, NameAlias right) {
+            final String leftAlias = left.getAlias();
+            final String rightAlias = right.getAlias();
+            return leftAlias.compareTo(rightAlias);
+        }
+    }
+
+    private HashMap<Integer, LinkedList<NameAlias>> loadNameAliases() {
+        HashMap<Integer, LinkedList<NameAlias>> nameAliasesByCodePoint = new HashMap<>();
+        final PropertyParsingInfo fileInfo =
+                PropertyParsingInfo.getPropertyInfo(UcdProperty.Name_Alias);
+        String fullFilename = fileInfo.getFullFileName(indexUnicodeProperties.getUcdVersion());
+        UcdLineParser parser = new UcdLineParser(FileUtilities.in("", fullFilename));
+        NameAliasComparator nameAliasComparator = new NameAliasComparator();
+
+        for (UcdLineParser.UcdLine line : parser) {
+            String[] parts = line.getParts();
+            int codepoint = Integer.parseInt(parts[0], 16);
+            NameAlias nameAlias;
+            if (parts.length < 3) {
+                nameAlias = new NameAlias(parts[1], AliasType.NONE);
+            } else {
+                nameAlias =
+                        new NameAlias(
+                                parts[1], AliasType.valueOf(parts[2].toUpperCase(Locale.ROOT)));
+            }
+
+            if (nameAliasesByCodePoint.containsKey(codepoint)) {
+                LinkedList<NameAlias> nameAliases =
+                        new LinkedList<>(nameAliasesByCodePoint.get(codepoint));
+                nameAliases.add(nameAlias);
+                nameAliases.sort(nameAliasComparator);
+                nameAliasesByCodePoint.replace(codepoint, nameAliases);
+            } else {
+                nameAliasesByCodePoint.put(codepoint, new LinkedList<>(List.of(nameAlias)));
+            }
+        }
+        return nameAliasesByCodePoint;
+    }
+
+    /**
+     * Returns the string written for {@code prop} at {@code codepoint}. The starting point is
+     * IndexUnicodeProperties.getResolvedValue, which is then adjusted by property type:
+     *
+     * <ul>
+     *   <li>Numeric: kOtherNumeric, kPrimaryNumeric and kAccountingNumeric yield null in place
+     *       of "NaN"; every other numeric property yields "NaN" in place of null.
+     *   <li>String: the value is rendered by getMappingValue. Its "#" result becomes null for
+     *       Equivalent_Unified_Ideograph and "" for kCompatibilityVariant, kSimplifiedVariant,
+     *       kTraditionalVariant and Bidi_Mirroring_Glyph; other properties return it as is.
+     *   <li>Miscellaneous: Jamo_Short_Name and Name replace null with ""; a Name starting with
+     *       one of six fixed prefixes is collapsed to that prefix followed by "#"; kDefinition
+     *       is returned unchanged (possibly null); anything else has "|" replaced by a space,
+     *       or is "" when null.
+     *   <li>Catalog: short names taken from the maps loaded in the constructor; an Age short
+     *       name of "NA" becomes "unassigned"; Script_Extensions becomes space-separated
+     *       script short names.
+     *   <li>Enumerated: Decomposition_Type is its lower-cased short name; anything else is the
+     *       first value alias of the property's value.
+     *   <li>Binary: "N" for "No" and "Y" for "Yes".
+     * </ul>
+     *
+     * @param prop the property to look up
+     * @param codepoint the code point to look up
+     * @return the attribute value; may be null in the cases listed above
+     * @throws RuntimeException for a Catalog property other than Age, Block, Script or
+     *     Script_Extensions, for a Binary value other than "Yes"/"No", or for a property type
+     *     not handled here
+     */
+    public String getAttributeValue(UcdProperty prop, int codepoint) {
+        String resolvedValue = indexUnicodeProperties.getResolvedValue(prop, codepoint);
+        switch (prop.getType()) {
+            case Numeric:
+                switch (prop) {
+                    case kOtherNumeric:
+                    case kPrimaryNumeric:
+                    case kAccountingNumeric:
+                        // Constant-first comparison: a null resolved value is passed through
+                        // as null instead of raising a NullPointerException.
+                        return ("NaN".equals(resolvedValue)) ? null : resolvedValue;
+                    default:
+                        return Optional.ofNullable(resolvedValue).orElse("NaN");
+                }
+            case String:
+                switch (prop) {
+                    case Equivalent_Unified_Ideograph:
+                        String EqUIdeo = getMappingValue(codepoint, resolvedValue, false, "");
+                        return (EqUIdeo.equals("#")) ? null : EqUIdeo;
+                    case kCompatibilityVariant:
+                        String kCompatibilityVariant =
+                                getMappingValue(codepoint, resolvedValue, false, "U+");
+                        return (kCompatibilityVariant.equals("#")) ? "" : kCompatibilityVariant;
+                    case kSimplifiedVariant:
+                    case kTraditionalVariant:
+                        // For code points in the Unihan attribute range a mapping to the code
+                        // point itself is written out rather than collapsed to "#".
+                        String kVariant =
+                                getMappingValue(
+                                        codepoint,
+                                        resolvedValue,
+                                        isUnihanAttributeRange(codepoint),
+                                        "U+");
+                        return (kVariant.equals("#")) ? "" : kVariant;
+                    case Bidi_Mirroring_Glyph:
+                        // Returning empty string for bmg to maintain compatibility with older
+                        // generated files.
+                        String bmg = getMappingValue(codepoint, resolvedValue, false, "");
+                        return (bmg.equals("#")) ? "" : bmg;
+                    default:
+                        return getMappingValue(codepoint, resolvedValue, false, "");
+                }
+            case Miscellaneous:
+                switch (prop) {
+                    case Jamo_Short_Name:
+                        return Optional.ofNullable(resolvedValue).orElse("");
+                    case Name:
+                        // Names beginning with one of these prefixes are reported as the
+                        // prefix followed by "#".
+                        if (resolvedValue != null
+                                && resolvedValue.startsWith("CJK UNIFIED IDEOGRAPH-")) {
+                            return "CJK UNIFIED IDEOGRAPH-#";
+                        }
+                        if (resolvedValue != null
+                                && resolvedValue.startsWith("CJK COMPATIBILITY IDEOGRAPH-")) {
+                            return "CJK COMPATIBILITY IDEOGRAPH-#";
+                        }
+                        if (resolvedValue != null
+                                && resolvedValue.startsWith("TANGUT IDEOGRAPH-")) {
+                            return "TANGUT IDEOGRAPH-#";
+                        }
+                        if (resolvedValue != null
+                                && resolvedValue.startsWith("KHITAN SMALL SCRIPT CHARACTER-")) {
+                            return "KHITAN SMALL SCRIPT CHARACTER-#";
+                        }
+                        if (resolvedValue != null && resolvedValue.startsWith("NUSHU CHARACTER-")) {
+                            return "NUSHU CHARACTER-#";
+                        }
+                        if (resolvedValue != null
+                                && resolvedValue.startsWith("EGYPTIAN HIEROGLYPH-")) {
+                            return "EGYPTIAN HIEROGLYPH-#";
+                        }
+                        return Optional.ofNullable(resolvedValue).orElse("");
+                    case kDefinition:
+                        return resolvedValue;
+                    default:
+                        if (resolvedValue != null) {
+                            return resolvedValue.replaceAll("\\|", " ");
+                        }
+                        return "";
+                }
+            case Catalog:
+                switch (prop) {
+                    case Age:
+                        String age = map_age.get(codepoint).getShortName();
+                        return (age.equals("NA")) ? "unassigned" : age;
+                    case Block:
+                        return map_block.get(codepoint).getShortName();
+                    case Script:
+                        return map_script.get(codepoint).getShortName();
+                    case Script_Extensions:
+                        // The map value is a "|"-separated list of Script_Values constant
+                        // names; emit their short names separated by single spaces.
+                        StringBuilder extensionBuilder = new StringBuilder();
+                        String[] extensions = map_script_extensions.get(codepoint).split("\\|", 0);
+                        for (String extension : extensions) {
+                            extensionBuilder.append(
+                                    UcdPropertyValues.Script_Values.valueOf(extension)
+                                            .getShortName());
+                            extensionBuilder.append(" ");
+                        }
+                        return extensionBuilder.toString().trim();
+                    default:
+                        throw new RuntimeException("Missing Catalog case");
+                }
+            case Enumerated:
+                switch (prop) {
+                    case Decomposition_Type:
+                        // Returning lower case to maintain compatibility with older generated
+                        // files.
+                        return map_decomposition_type
+                                .get(codepoint)
+                                .getShortName()
+                                .toLowerCase(Locale.ROOT);
+                    default:
+                        final UnicodeProperty property = indexUnicodeProperties.getProperty(prop);
+                        final List<String> valueAliases =
+                                property.getValueAliases(property.getValue(codepoint));
+                        return valueAliases.get(0);
+                }
+            case Binary:
+                {
+                    switch (resolvedValue) {
+                            // Seems overkill to get this from UcdPropertyValues.Binary
+                        case "No":
+                            return "N";
+                        case "Yes":
+                            return "Y";
+                        default:
+                            throw new RuntimeException("Unexpected Binary value");
+                    }
+                }
+            default:
+                throw new RuntimeException("Missing PropertyType case");
+        }
+    }
+
+    /**
+     * Reports whether the General_Category of {@code codepoint} is Unassigned, Private_Use or
+     * Surrogate.
+     *
+     * @param codepoint the code point to test
+     * @return true for any of those three categories, false otherwise (including when no
+     *     category is mapped)
+     */
+    public boolean isUnassignedCodePoint(int codepoint) {
+        // Identity comparison on enum constants; a null category simply matches nothing.
+        final UcdPropertyValues.General_Category_Values category = getgc(codepoint);
+        return category == UcdPropertyValues.General_Category_Values.Unassigned
+                || category == UcdPropertyValues.General_Category_Values.Private_Use
+                || category == UcdPropertyValues.General_Category_Values.Surrogate;
+    }
+
+    /**
+     * Looks up the General_Category of {@code codepoint} in the map loaded by the constructor.
+     *
+     * @param codepoint the code point to look up
+     * @return the value stored in the General_Category map for that code point
+     */
+    public UcdPropertyValues.General_Category_Values getgc(int codepoint) {
+        final UcdPropertyValues.General_Category_Values category =
+                map_general_category.get(codepoint);
+        return category;
+    }
+
+    /**
+     * Convenience accessor for the Noncharacter_Code_Point attribute.
+     *
+     * @param codepoint the code point to look up
+     * @return whatever getAttributeValue returns for Noncharacter_Code_Point at that code point
+     */
+    public String getNChar(int codepoint) {
+        final UcdProperty noncharacter = UcdProperty.Noncharacter_Code_Point;
+        return getAttributeValue(noncharacter, codepoint);
+    }
+
+    /**
+     * Returns the name aliases recorded for {@code codepoint}.
+     *
+     * @param codepoint the code point to look up
+     * @return a map from alias text to alias type label, iterating in the stored (alias-sorted)
+     *     list order, or null when the code point has no aliases
+     */
+    public HashMap<String, String> getNameAliases(int codepoint) {
+        final LinkedList<NameAlias> aliasesForCodePoint = map_NameAlias.get(codepoint);
+        if (aliasesForCodePoint == null || aliasesForCodePoint.isEmpty()) {
+            return null;
+        }
+        // LinkedHashMap keeps the order in which the aliases are inserted.
+        final HashMap<String, String> typeByAlias = new LinkedHashMap<>();
+        for (NameAlias entry : aliasesForCodePoint) {
+            typeByAlias.put(entry.getAlias(), entry.getType().toString());
+        }
+        return typeByAlias;
+    }
+
+    private String getMappingValue(
+            int codepoint, String resolvedValue, boolean ignoreUnihanRange, String prefix) {
+        if (null == resolvedValue) {
+            return "#";
+        }
+        int[] resolvedValueInts = resolvedValue.codePoints().toArray();
+        if (resolvedValueInts.length == 1
+                && resolvedValueInts[0] == codepoint
+                && !ignoreUnihanRange) {
+            return "#";
+        }
+        StringBuilder sb = new StringBuilder();
+        for (int i : resolvedValueInts) {
+            sb.append(prefix).append(getCPString(i)).append(" ");
+        }
+        return sb.toString().trim();
+    }
+
+    /**
+     * Reports whether two code points differ in any range-defining property that applies to
+     * {@code ucdVersion}.
+     *
+     * <p>A property detail applies when {@code ucdVersion} is at or above its minimum version
+     * and, if it has a maximum version, strictly below that maximum.
+     *
+     * @param ucdVersion the UCD version being generated
+     * @param codepointA the first code point
+     * @param codepointB the second code point
+     * @return true as soon as one applicable property has different attribute values for the
+     *     two code points, false if none does
+     */
+    public boolean isDifferentRange(VersionInfo ucdVersion, int codepointA, int codepointB) {
+        for (UCDPropertyDetail detail : rangeDefiningPropertyDetails) {
+            if (ucdVersion.compareTo(detail.getMinVersion()) < 0) {
+                continue;
+            }
+            if (detail.getMaxVersion() != null
+                    && ucdVersion.compareTo(detail.getMaxVersion()) >= 0) {
+                continue;
+            }
+            final UcdProperty property = detail.getUcdProperty();
+            final String valueA = getAttributeValue(property, codepointA);
+            final String valueB = getAttributeValue(property, codepointB);
+            if (!valueA.equals(valueB)) {
+                return true;
+            }
+        }
+        return false;
+    }
+
+    /**
+     * Formats a code point as upper-case hexadecimal, zero-padded to at least four digits.
+     *
+     * @param codepoint the code point to format
+     * @return for example "0041" for 0x41 and "1F600" for 0x1F600
+     */
+    private static String getCPString(int codepoint) {
+        // %04X pads with zeros to width four and upper-cases the digits in one step.
+        return String.format(Locale.ROOT, "%04X", codepoint);
+    }
+
+    /**
+     * Public entry point to the hexadecimal formatting done by getCPString.
+     *
+     * @param codepoint the code point to format
+     * @return the string getCPString produces for {@code codepoint}
+     */
+    public String getHexString(int codepoint) {
+        final String hex = getCPString(codepoint);
+        return hex;
+    }
+
+    /**
+     * Reports whether {@code codepoint} has a Unified_Ideograph attribute of "Y" or a non-empty
+     * kCompatibilityVariant attribute.
+     *
+     * @param codepoint the code point to test
+     * @return true if either condition holds
+     */
+    public boolean isUnihanAttributeRange(int codepoint) {
+        final String unifiedIdeograph =
+                getAttributeValue(UcdProperty.Unified_Ideograph, codepoint);
+        if (unifiedIdeograph.equals("Y")) {
+            return true;
+        }
+        // Only consulted when the code point is not a unified ideograph.
+        final String compatibilityVariant =
+                getAttributeValue(UcdProperty.kCompatibilityVariant, codepoint);
+        return !compatibilityVariant.isEmpty();
+    }
+
+    /**
+     * Reports whether {@code codepoint} has a Unified_Ideograph attribute of "Y" and a Name
+     * attribute equal to "CJK UNIFIED IDEOGRAPH-#".
+     *
+     * @param codepoint the code point to test
+     * @return true only if both conditions hold
+     */
+    public boolean isUnifiedIdeograph(int codepoint) {
+        final String unifiedIdeograph =
+                getAttributeValue(UcdProperty.Unified_Ideograph, codepoint);
+        if (!unifiedIdeograph.equals("Y")) {
+            return false;
+        }
+        // The name is only looked up once the binary property has matched.
+        final String name = getAttributeValue(UcdProperty.Name, codepoint);
+        return name.equals("CJK UNIFIED IDEOGRAPH-#");
+    }
+}
diff --git a/unicodetools/src/main/java/org/unicode/xml/CompareUCDXML.java b/unicodetools/src/main/java/org/unicode/xml/CompareUCDXML.java
new file mode 100644
index 000000000..f09f98e86
--- /dev/null
+++ b/unicodetools/src/main/java/org/unicode/xml/CompareUCDXML.java
@@ -0,0 +1,203 @@
+package org.unicode.xml;
+
+import com.ibm.icu.dev.tool.UOption;
+import com.ibm.icu.impl.UnicodeMap;
+import com.ibm.icu.text.UnicodeSet;
+import java.io.File;
+import java.io.IOException;
+import java.util.HashMap;
+import java.util.Objects;
+import org.unicode.props.UcdProperty;
+
+/**
+ * Utility for comparing two UCDXML files. Originally intended to compare UCDXML files generated
+ * using https://github.com/eric-muller/ucdxml to UCDXML files generated using
+ * org.unicode.xml.UCDXML.
+ */
+public class CompareUCDXML {
+
+    private static final String NEWLINE = System.getProperty("line.separator");
+    private static final UOption[] options = {
+        UOption.HELP_H(),
+        UOption.create("fileA", 'a', UOption.REQUIRES_ARG),
+        UOption.create("fileB", 'b', UOption.REQUIRES_ARG)
+    };
+
+    private static final UcdProperty[] codepointSequenceProperties =
+            new UcdProperty[] {
+                UcdProperty.Named_Sequences,
+                UcdProperty.Named_Sequences_Prov,
+                UcdProperty.Standardized_Variant,
+                UcdProperty.Emoji_DCM,
+                UcdProperty.Emoji_KDDI,
+                UcdProperty.Emoji_SB,
+                UcdProperty.Do_Not_Emit_Preferred
+            };
+
+    // Differences that are expected and therefore not reported for single code points.
+    // Key: code point. Value: the two attribute values that may be seen for it, one per file;
+    // isKnownDifference accepts the pair in either order.
+    private static final HashMap<Integer, String[]> knownDifferences;
+
+    // Each group below is preceded by the issue that tracks it.
+    static {
+        knownDifferences = new HashMap<>();
+
+        // https://github.com/unicode-org/properties/issues/296
+        knownDifferences.put(0x31E4, new String[] {"Hani", "Zyyy"});
+        knownDifferences.put(0x31E5, new String[] {"Hani", "Zyyy"});
+
+        // https://github.com/unicode-org/unicodetools/issues/325
+        knownDifferences.put(0x109F7, new String[] {"1/6", "2/12"});
+        knownDifferences.put(0x109F8, new String[] {"1/4", "3/12"});
+        knownDifferences.put(0x109F9, new String[] {"1/3", "4/12"});
+        knownDifferences.put(0x109FB, new String[] {"1/2", "6/12"});
+        knownDifferences.put(0x109FD, new String[] {"2/3", "8/12"});
+        knownDifferences.put(0x109FE, new String[] {"3/4", "9/12"});
+        knownDifferences.put(0x109FF, new String[] {"5/6", "10/12"});
+
+        // https://github.com/unicode-org/properties/issues/172
+        knownDifferences.put(0x5146, new String[] {"1000000", "1000000 1000000000000"});
+        knownDifferences.put(0x79ED, new String[] {"1000000000", "1000000000 1000000000000"});
+    }
+
+    // Indices into the options array. The former LOGFILE = 3 entry was unused and pointed past
+    // the end of that three-element array.
+    private static final int HELP = 0, FILE_A = 1, FILE_B = 2;
+
+    public static void main(String[] args) throws Exception {
+        File fileA = null;
+        File fileB = null;
+        int errorCount = 0;
+
+        UOption.parseArgs(args, options);
+
+        if (options[HELP].doesOccur) {
+            System.out.println("CompareUcdXML --fileA {file path} --fileB {file path}");
+            System.exit(0);
+        }
+
+        if (options[FILE_A].doesOccur) {
+            try {
+                fileA = new File(options[FILE_A].value);
+                if (!fileA.exists()) {
+                    throw new IOException();
+                }
+            } catch (Exception e) {
+                throw new IllegalArgumentException("Could not find " + options[FILE_A].value);
+            }
+        } else {
+            throw new IllegalArgumentException("Missing command line option: --fileA (or -a)");
+        }
+
+        if (options[FILE_B].doesOccur) {
+            try {
+                fileB = new File(options[FILE_B].value);
+                if (!fileB.exists()) {
+                    throw new IOException();
+                }
+            } catch (Exception e) {
+                throw new IllegalArgumentException("Could not find " + options[FILE_B].value);
+            }
+        } else {
+            throw new IllegalArgumentException("Missing command line option: --fileB (or -b)");
+        }
+
+        System.out.println("Comparing " + fileA + " and " + fileB);
+
+        final XMLProperties xmlPropsA = new XMLProperties(fileA);
+        final XMLProperties xmlPropsB = new XMLProperties(fileB);
+
+        // First, iterate through the UcdProperties on each codepoint.
+        for (final UcdProperty prop : UcdProperty.values()) {
+            UnicodeMap<String> fileAMap = xmlPropsA.getMap(prop);
+            UnicodeMap<String> fileBMap = xmlPropsB.getMap(prop);
+            if (!fileAMap.equals(fileBMap)) {
+                for (int i = 0; i <= 0x10ffff; ++i) {
+                    try {
+                        String xmlValA = fileAMap.get(i);
+                        String xmlValB = fileBMap.get(i);
+                        if (!Objects.equals(xmlValA, xmlValB)) {
+                            // At least one string is != null and the strings are different, but we
+                            // don't care if one
+                            // is null and one is empty_string
+                            // As far as we care, empty_string == null == "00000"
+                            int lenA =
+                                    (xmlValA == null
+                                            ? 0
+                                            : (xmlValA.equals("00000") ? 0 : xmlValA.length()));
+                            int lenB =
+                                    (xmlValB == null
+                                            ? 0
+                                            : (xmlValB.equals("00000") ? 0 : xmlValB.length()));
+                            if (!(lenA == 0 && lenB == 0)
+                                    && !isKnownDifference(i, xmlValA, xmlValB)) {
+                                errorCount++;
+                                System.out.println(
+                                        "For UCDProperty "
+                                                + prop.name()
+                                                + " ("
+                                                + prop.getShortName()
+                                                + ") ["
+                                                + String.format("0x%04X", i)
+                                                + "], ");
+                                System.out.println("\t" + fileA + " = " + xmlValA);
+                                System.out.println("\t" + fileB + " = " + xmlValB);
+                            }
+                        }
+                    } catch (Exception e) {
+                        System.out.println("Exception thrown for " + String.format("0x%04X", i));
+                        System.out.println(e.getMessage());
+                    }
+                }
+            }
+        }
+        // Now handle anything that contains codepoint sequences.
+        for (UcdProperty prop : codepointSequenceProperties) {
+            UnicodeMap<String> fileAMap = xmlPropsA.getMap(prop);
+            UnicodeMap<String> fileBMap = xmlPropsB.getMap(prop);
+            UnicodeSet differences = fileAMap.keySet().addAll(fileBMap.keySet());
+            for (String key : differences) {
+                try {
+                    String xmlValA = fileAMap.get(key);
+                    String xmlValB = fileBMap.get(key);
+                    if (!Objects.equals(xmlValA, xmlValB)) {
+                        // At least one string is != null and the strings are different, but we
+                        // don't care if one
+                        // is null and one is empty_string
+                        // As far as we care, empty_string == null == "00000"
+                        int lenA =
+                                (xmlValA == null
+                                        ? 0
+                                        : (xmlValA.equals("00000") ? 0 : xmlValA.length()));
+                        int lenB =
+                                (xmlValB == null
+                                        ? 0
+                                        : (xmlValB.equals("00000") ? 0 : xmlValB.length()));
+                        if (!(lenA == 0 && lenB == 0)) {
+                            errorCount++;
+                            System.out.println(
+                                    "For UCDProperty "
+                                            + prop.name()
+                                            + " ("
+                                            + prop.getShortName()
+                                            + ") ["
+                                            + key
+                                            + "], ");
+                            System.out.println("\t" + fileA + " = " + xmlValA);
+                            System.out.println("\t" + fileB + " = " + xmlValB);
+                        }
+                    }
+                } catch (Exception e) {
+                    System.out.println("Exception thrown for " + String.format("0x%04X", key));
+                    System.out.println(e.getMessage());
+                }
+            }
+        }
+        System.exit(errorCount);
+    }
+
+    private static boolean isKnownDifference(int codepoint, String xmlValA, String xmlValB) {
+        if (knownDifferences.containsKey(codepoint)) {
+            String knownValue1 = knownDifferences.get(codepoint)[0];
+            String knownValue2 = knownDifferences.get(codepoint)[1];
+            return (knownValue1.equals(xmlValA) && knownValue2.equals(xmlValB))
+                    || (knownValue1.equals(xmlValB) && knownValue2.equals(xmlValA));
+        }
+        return false;
+    }
+}
diff --git a/unicodetools/src/main/java/org/unicode/xml/GeneratePropertyValues.java b/unicodetools/src/main/java/org/unicode/xml/GeneratePropertyValues.java
new file mode 100644
index 000000000..0d28734b0
--- /dev/null
+++ b/unicodetools/src/main/java/org/unicode/xml/GeneratePropertyValues.java
@@ -0,0 +1,1772 @@
+package org.unicode.xml;
+
+import com.ibm.icu.dev.tool.UOption;
+import com.ibm.icu.util.VersionInfo;
+import java.io.BufferedWriter;
+import java.io.File;
+import java.io.FileOutputStream;
+import java.io.IOException;
+import java.io.InputStream;
+import java.io.OutputStreamWriter;
+import java.net.URI;
+import java.net.URISyntaxException;
+import java.nio.charset.StandardCharsets;
+import java.util.ArrayList;
+import java.util.Arrays;
+import java.util.Collections;
+import java.util.HashMap;
+import java.util.List;
+import java.util.regex.Matcher;
+import java.util.regex.Pattern;
+import org.unicode.props.PropertyParsingInfo;
+import org.unicode.props.UcdProperty;
+import org.unicode.props.UcdPropertyValues.*;
+import org.unicode.text.utility.Settings;
+
+/**
+ * Utility for generating fragments that describe the property values in a format that can be
+ * displayed in UAX42. UAX42 fragments live in
+ * unicodetools/src/main/resources/org/unicode/uax42/fragments
+ */
+public class GeneratePropertyValues {
+
+    /**
+     * Layout styles that can be requested when a list of property values is formatted for a
+     * fragment. The chosen constant is handed to {@code formatValues}; the constant names suggest
+     * the layouts (one value per line, alphabetical or numerical grouping, wrapping at a maximum
+     * line length). NOTE(review): confirm the exact layouts against {@code formatValues}.
+     */
+    private enum VALUESOUTPUTTYPE {
+        VALUE_PER_LINE,
+        ALPHABETICAL_GROUP,
+        NUMERICAL_GROUP,
+        MAX_LINE_LENGTH;
+    }
+
+    /**
+     * Schema sections that a fragment can belong to. {@link #getName()} supplies the section name
+     * that is written into the {@code id='schema.<name>'} attribute of a generated fragment.
+     */
+    private enum SCHEMA {
+        // A constant preceded by a "Manual" comment corresponds to a fragment file that is
+        // maintained by hand rather than generated by this utility.
+        // Manual
+        NAMESPACE("namespace"),
+        // Manual
+        DATATYPES("datatypes"),
+        // Manual
+        START("start"),
+        BOOLEAN("boolean"),
+        // Manual
+        DESCRIPTION("description"),
+        // Manual
+        REPERTOIRE("repertoire"),
+        PROPERTIES("properties"),
+        TANGUT("tangut"),
+        NUSHU("nushu"),
+        EMOJI_DATA("emoji-data"),
+        // Manual
+        BLOCK("block"),
+        // Manual
+        NAMED_SEQUENCES("named-sequences"),
+        // Manual
+        NORMALIZATION_CORRECTIONS("normalization-corrections"),
+        // Manual
+        STANDARDIZED_VARIANTS("standardized-variants"),
+        // Manual
+        CJK_RADICALS("cjk-radicals"),
+        // Manual
+        EMOJI_SOURCES("emoji-sources"),
+        DO_NOT_EMIT("do-not-emit");
+
+        // Section name as it appears in fragment ids (and in the file name of schema-level
+        // fragments).
+        final String name;
+
+        SCHEMA(String name) {
+            this.name = name;
+        }
+
+        /** Returns the section name associated with this constant. */
+        String getName() {
+            return this.name;
+        }
+    }
+
+    /**
+     * Syntax details for one property, as stored in the {@code syntaxTR38} map and consumed by
+     * {@code formatTR38Syntax}.
+     */
+    private static final class TR38Details {
+        // Whether formatTR38Syntax should wrap the syntax in a "list { ... }" construct.
+        boolean isList;
+        // Syntax expression for the property values; it is run through cleanRegex before output.
+        String syntax;
+
+        /**
+         * @param isList whether the property value is a list of items matching {@code syntax}
+         * @param syntax the syntax expression for the property
+         */
+        public TR38Details(boolean isList, String syntax) {
+            this.isList = isList;
+            this.syntax = syntax;
+        }
+
+        /** Returns whether the property value is treated as a list. */
+        public boolean isList() {
+            return isList;
+        }
+
+        /** Returns the syntax expression for the property. */
+        public String getSyntax() {
+            return syntax;
+        }
+    }
+
+    // Presumably the maximum width of a line of formatted values — TODO confirm in formatValues.
+    private static final int MAX_LINE_LENGTH = 70;
+    // One, two and three platform line separators.
+    private static final String NEWLINE = System.lineSeparator();
+    private static final String DOUBLELINE = System.lineSeparator() + System.lineSeparator();
+    private static final String TRIPLELINE =
+            System.lineSeparator() + System.lineSeparator() + System.lineSeparator();
+    // Folder that receives the fragment files; set by main before any fragment is written.
+    private static File destinationFolder = null;
+
+    // Syntax details keyed by UcdProperty.name(); populated by parseTR38() in
+    // buildPropertyValues.
+    private static HashMap<String, TR38Details> syntaxTR38;
+    // Namespace bound to the ucdxml prefix in every generated fragment.
+    private static final String NAMESPACE = "http://unicode.org/ns/2001/ucdxml";
+    // Location of UAX #38; quoted in the error raised when a property has no TR38 details.
+    private static final String TR38URL = "https://www.unicode.org/reports/tr38";
+    // Command-line options; the constants below are the indices into this array.
+    private static final UOption[] options = {
+        UOption.HELP_H(),
+        UOption.create("ucdversion", 'v', UOption.OPTIONAL_ARG),
+        UOption.create("outputfolder", 'f', UOption.REQUIRES_ARG)
+    };
+
+    private static final int HELP = 0, UCDVERSION = 1, OUTPUTFOLDER = 2;
+
+    /**
+     * Command-line entry point: resolves the UCD version and the output folder, then generates
+     * the UAX42 fragment files.
+     *
+     * <p>Options: {@code --ucdversion} (defaults to {@code Settings.latestVersion}) and {@code
+     * --outputfolder} (defaults to {@code uax42/fragments} under {@code Settings.Output.GEN_DIR}).
+     * The process exits with status 0 on success or after printing the usage line, and with
+     * status 1 if an option is invalid or the output folder cannot be found or created.
+     *
+     * @param args command-line arguments
+     * @throws Exception if option parsing or fragment generation fails
+     */
+    public static void main(String[] args) throws Exception {
+        UOption.parseArgs(args, options);
+
+        if (options[HELP].doesOccur) {
+            System.out.println(
+                    "GeneratePropertyValues [--ucdversion {version number}] [--outputfolder {destination}]");
+            System.exit(0);
+        }
+
+        VersionInfo ucdVersion = null;
+        try {
+            ucdVersion = resolveUcdVersion();
+            destinationFolder = resolveDestinationFolder();
+        } catch (Exception e) {
+            System.err.println(e.getMessage());
+            System.exit(1);
+        }
+
+        if (ucdVersion != null && destinationFolder != null && destinationFolder.exists()) {
+            buildPropertyValues(ucdVersion);
+            System.out.println("End");
+            System.exit(0);
+        } else {
+            System.err.println("Unexpected error when generating uax42 fragment files.");
+            System.exit(1);
+        }
+    }
+
+    /**
+     * Returns the version given with {@code --ucdversion}, or the latest known version when the
+     * option is absent.
+     *
+     * @throws IllegalArgumentException if the supplied value is not a valid version
+     */
+    private static VersionInfo resolveUcdVersion() {
+        if (!options[UCDVERSION].doesOccur) {
+            return VersionInfo.getInstance(Settings.latestVersion);
+        }
+        try {
+            return VersionInfo.getInstance(options[UCDVERSION].value);
+        } catch (Exception e) {
+            // Keep the original failure as the cause so that it is not lost.
+            throw new IllegalArgumentException(
+                    "Could not convert "
+                            + options[UCDVERSION].value
+                            + " to a valid UCD version",
+                    e);
+        }
+    }
+
+    /**
+     * Returns the folder given with {@code --outputfolder}, or the default fragment folder under
+     * the generation directory, creating it (and any missing parents) if necessary.
+     *
+     * @throws IllegalArgumentException if the folder does not exist and cannot be created
+     */
+    private static File resolveDestinationFolder() {
+        // File.separator rather than a literal backslash: on non-Windows systems a backslash is
+        // an ordinary file-name character, so "uax42\\fragments\\" would name a single folder.
+        final String location =
+                options[OUTPUTFOLDER].doesOccur
+                        ? options[OUTPUTFOLDER].value
+                        : Settings.Output.GEN_DIR + "uax42" + File.separator + "fragments";
+        try {
+            final File folder = new File(location);
+            if (folder.isDirectory() || folder.mkdirs()) {
+                return folder;
+            }
+        } catch (RuntimeException e) {
+            throw new IllegalArgumentException("Could not find or create " + location, e);
+        }
+        throw new IllegalArgumentException("Could not find or create " + location);
+    }
+
+    /**
+     * Generates every fragment file produced by this utility.
+     *
+     * <p>The TR38 syntax table is loaded first (via {@code parseTR38}) and stored in {@code
+     * syntaxTR38}; each subsequent {@code createPropertyFragment} call then writes one fragment
+     * file for a single property or for a group of related properties.
+     *
+     * @param ucdVersion the requested UCD version; not referenced by the method body at present
+     * @throws IOException if a fragment file cannot be written
+     * @throws URISyntaxException presumably raised while loading the TR38 syntax — confirm
+     *     against {@code parseTR38}
+     */
+    private static void buildPropertyValues(
+            // It would be nice to be able to generate values by ucdVersion. Leaving this here for
+            // now...
+            VersionInfo ucdVersion) throws IOException, URISyntaxException {
+        syntaxTR38 = parseTR38();
+
+        createPropertyFragment(
+                SCHEMA.BOOLEAN,
+                getFormattedValues(SCHEMA.BOOLEAN, VALUESOUTPUTTYPE.MAX_LINE_LENGTH));
+        createPropertyFragment(
+                UcdProperty.Age,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(UcdProperty.Age, VALUESOUTPUTTYPE.NUMERICAL_GROUP));
+        createPropertyFragment(
+                UcdProperty.Name, SCHEMA.PROPERTIES, getFormattedSyntax(UcdProperty.Name));
+        createPropertyFragment(
+                UcdProperty.Unicode_1_Name,
+                SCHEMA.PROPERTIES,
+                getFormattedSyntax(UcdProperty.Unicode_1_Name));
+        createPropertyFragment(
+                UcdProperty.Name_Alias.getShortName() + ".xml",
+                "name-alias element",
+                SCHEMA.PROPERTIES,
+                getFormattedElement(UcdProperty.Name_Alias));
+        createPropertyFragment(
+                UcdProperty.Block,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(UcdProperty.Block, VALUESOUTPUTTYPE.VALUE_PER_LINE));
+        createPropertyFragment(
+                UcdProperty.General_Category,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(
+                        UcdProperty.General_Category, VALUESOUTPUTTYPE.ALPHABETICAL_GROUP));
+        createPropertyFragment(
+                UcdProperty.Canonical_Combining_Class,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(
+                        UcdProperty.Canonical_Combining_Class, VALUESOUTPUTTYPE.VALUE_PER_LINE));
+        createPropertyFragment(
+                UcdProperty.Bidi_Class,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(UcdProperty.Bidi_Class, VALUESOUTPUTTYPE.ALPHABETICAL_GROUP));
+        createPropertyFragment(
+                UcdProperty.Bidi_Mirrored,
+                SCHEMA.PROPERTIES,
+                getFormattedBoolean(UcdProperty.Bidi_Mirrored));
+        createPropertyFragment(
+                UcdProperty.Bidi_Mirroring_Glyph,
+                SCHEMA.PROPERTIES,
+                getFormattedSyntax(UcdProperty.Bidi_Mirroring_Glyph));
+        createPropertyFragment(
+                UcdProperty.Bidi_Control,
+                SCHEMA.PROPERTIES,
+                getFormattedBoolean(UcdProperty.Bidi_Control));
+        createPropertyFragment(
+                UcdProperty.Bidi_Paired_Bracket_Type,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(
+                        UcdProperty.Bidi_Paired_Bracket_Type, VALUESOUTPUTTYPE.MAX_LINE_LENGTH));
+        createPropertyFragment(
+                UcdProperty.Bidi_Paired_Bracket,
+                SCHEMA.PROPERTIES,
+                getFormattedSyntax(UcdProperty.Bidi_Paired_Bracket));
+        createPropertyFragment(
+                "decomposition.xml",
+                "decomposition properties",
+                SCHEMA.PROPERTIES,
+                getFormattedDecompositionProperties());
+        createPropertyFragment(
+                "composition.xml",
+                "composition properties",
+                SCHEMA.PROPERTIES,
+                getFormattedCompositionProperties());
+        createPropertyFragment(
+                "quickcheck.xml",
+                "quick check properties",
+                SCHEMA.PROPERTIES,
+                getFormattedQuickCheckProperties());
+        createPropertyFragment(
+                "numeric.xml",
+                "numeric properties",
+                SCHEMA.PROPERTIES,
+                getFormattedNumericProperties());
+        createPropertyFragment(
+                "joining.xml",
+                "joining properties",
+                SCHEMA.PROPERTIES,
+                getFormattedJoiningProperties());
+        createPropertyFragment(
+                UcdProperty.Join_Control.getShortName() + ".xml",
+                "joining properties",
+                SCHEMA.PROPERTIES,
+                getFormattedBoolean(UcdProperty.Join_Control));
+        createPropertyFragment(
+                UcdProperty.Line_Break,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(UcdProperty.Line_Break, VALUESOUTPUTTYPE.ALPHABETICAL_GROUP));
+        createPropertyFragment(
+                UcdProperty.East_Asian_Width,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(
+                        UcdProperty.East_Asian_Width, VALUESOUTPUTTYPE.MAX_LINE_LENGTH));
+        createPropertyFragment(
+                "casing.xml",
+                "casing properties",
+                SCHEMA.PROPERTIES,
+                getFormattedCasingProperties());
+        createPropertyFragment(
+                "simple_case_mapping.xml",
+                "casing properties",
+                SCHEMA.PROPERTIES,
+                getFormattedSimpleCaseMappingProperties());
+        createPropertyFragment(
+                "case_mapping.xml",
+                "casing properties",
+                SCHEMA.PROPERTIES,
+                getFormattedCaseMappingProperties());
+        createPropertyFragment(
+                "case_folding.xml",
+                "casing properties",
+                SCHEMA.PROPERTIES,
+                getFormattedCaseFoldingProperties());
+        createPropertyFragment(
+                "case_other.xml",
+                "casing properties",
+                SCHEMA.PROPERTIES,
+                getFormattedCaseOtherProperties());
+        createPropertyFragment(
+                "script.xml",
+                "script properties",
+                SCHEMA.PROPERTIES,
+                getFormattedScriptProperties());
+        createPropertyFragment(
+                UcdProperty.ISO_Comment,
+                SCHEMA.PROPERTIES,
+                getFormattedSyntax(UcdProperty.ISO_Comment));
+        createPropertyFragment(
+                UcdProperty.Hangul_Syllable_Type,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(
+                        UcdProperty.Hangul_Syllable_Type, VALUESOUTPUTTYPE.MAX_LINE_LENGTH));
+        createPropertyFragment(
+                UcdProperty.Jamo_Short_Name,
+                SCHEMA.PROPERTIES,
+                getFormattedSyntax(UcdProperty.Jamo_Short_Name));
+        createPropertyFragment(
+                UcdProperty.Indic_Syllabic_Category,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(
+                        UcdProperty.Indic_Syllabic_Category, VALUESOUTPUTTYPE.VALUE_PER_LINE));
+        createPropertyFragment(
+                UcdProperty.Indic_Positional_Category,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(
+                        UcdProperty.Indic_Positional_Category, VALUESOUTPUTTYPE.VALUE_PER_LINE));
+        createPropertyFragment(
+                UcdProperty.Indic_Conjunct_Break,
+                SCHEMA.PROPERTIES,
+                getFormattedAttribute(
+                        UcdProperty.Indic_Conjunct_Break, VALUESOUTPUTTYPE.VALUE_PER_LINE));
+        createPropertyFragment(
+                "identifier.xml",
+                "identifier properties",
+                SCHEMA.PROPERTIES,
+                getFormattedIdentifierProperties());
+        createPropertyFragment(
+                "pattern.xml",
+                "pattern properties",
+                SCHEMA.PROPERTIES,
+                getFormattedPatternProperties());
+        createPropertyFragment(
+                "function_graphic.xml",
+                "properties related to function and graphic characteristics",
+                SCHEMA.PROPERTIES,
+                getFormattedFunctionGraphicProperties());
+        createPropertyFragment(
+                "boundaries.xml",
+                "properties related to boundaries",
+                SCHEMA.PROPERTIES,
+                getFormattedBoundaryProperties());
+        createPropertyFragment(
+                "ideographs.xml",
+                "properties related to ideographs",
+                SCHEMA.PROPERTIES,
+                getFormattedIdeographProperties());
+        createPropertyFragment(
+                "miscellaneous.xml",
+                "miscellaneous properties",
+                SCHEMA.PROPERTIES,
+                getFormattedMiscellaneousProperties());
+        createPropertyFragment(
+                "Unihan.xml",
+                "Unihan properties",
+                SCHEMA.PROPERTIES,
+                getFormattedUnihanProperties());
+        createPropertyFragment(
+                "Tangut.xml", "Tangut data", SCHEMA.TANGUT, getFormattedTangutProperties());
+        createPropertyFragment(
+                "Nushu.xml", "Nushu data", SCHEMA.NUSHU, getFormattedNushuProperties());
+        createPropertyFragment(
+                "Emoji.xml", "Emoji properties", SCHEMA.EMOJI_DATA, getFormattedEmojiProperties());
+        createPropertyFragment(
+                "do-not-emit.xml",
+                "do-not-emit",
+                SCHEMA.DO_NOT_EMIT,
+                getFormattedDoNotEmit(VALUESOUTPUTTYPE.VALUE_PER_LINE));
+    }
+
+    /**
+     * Writes a schema-level fragment: the file is named {@code <schema name>.xml} and the schema
+     * name doubles as the fragment title.
+     *
+     * @param schema the schema section the fragment belongs to
+     * @param formattedFragment the body of the fragment
+     * @throws IOException if the fragment file cannot be written
+     */
+    private static void createPropertyFragment(SCHEMA schema, String formattedFragment)
+            throws IOException {
+        final String schemaName = schema.getName();
+        createPropertyFragment(schemaName + ".xml", schemaName, schema, formattedFragment);
+    }
+
+    /**
+     * Writes the fragment for a single property: the file is named {@code <short name>.xml} and
+     * the title is {@code "<short name> attribute"}.
+     *
+     * @param ucdProperty the property whose short name determines the file name and title
+     * @param schema the schema section the fragment belongs to
+     * @param formattedFragment the body of the fragment
+     * @throws IOException if the fragment file cannot be written
+     */
+    private static void createPropertyFragment(
+            UcdProperty ucdProperty, SCHEMA schema, String formattedFragment) throws IOException {
+        final String shortName = ucdProperty.getShortName();
+        final String filename = shortName + ".xml";
+        final String title = shortName + " attribute";
+        createPropertyFragment(filename, title, schema, formattedFragment);
+    }
+
+    /**
+     * Writes one fragment file: an XML declaration, an opening {@code ucdxml:block} element
+     * carrying the title and the {@code schema.<name>} id, the fragment body, and the closing
+     * tag.
+     *
+     * @param filename name of the file to create inside the destination folder
+     * @param title value of the {@code title} attribute; written as-is, without XML escaping
+     * @param schema schema section whose name forms the {@code id} attribute
+     * @param formattedFragment the body of the fragment
+     * @throws IOException if the file cannot be created or written
+     */
+    private static void createPropertyFragment(
+            String filename, String title, SCHEMA schema, String formattedFragment)
+            throws IOException {
+        // try-with-resources flushes and closes the writer even when a write fails, so the file
+        // handle is never leaked.
+        try (BufferedWriter writer = getFragmentWriter(filename)) {
+            writer.write(
+                    "<?xml version=\"1.0\" encoding=\"UTF-8\"?>"
+                            + NEWLINE
+                            + "<ucdxml:block xmlns:ucdxml=\""
+                            + NAMESPACE
+                            + "\" title=\""
+                            + title
+                            + "\" id='schema."
+                            + schema.getName()
+                            + "'>"
+                            + NEWLINE);
+            writer.write(formattedFragment);
+            writer.write(NEWLINE + "</ucdxml:block>");
+        }
+    }
+
+    /**
+     * Opens a UTF-8 writer for a file in the destination folder, creating the folder (and any
+     * missing parents) first if it does not exist.
+     *
+     * @param filename name of the file to create inside the destination folder
+     * @return a buffered writer for the file; the caller is responsible for closing it
+     * @throws IOException if the folder cannot be created or the file cannot be opened
+     * @throws IllegalStateException if the destination folder has not been set
+     */
+    private static BufferedWriter getFragmentWriter(String filename) throws IOException {
+        // Without this check a null folder would be concatenated into the path "null/".
+        if (destinationFolder == null) {
+            throw new IllegalStateException("The destination folder has not been set.");
+        }
+        if (!destinationFolder.isDirectory() && !destinationFolder.mkdirs()) {
+            throw new IOException("Could not create " + destinationFolder);
+        }
+        final File outputFile = new File(destinationFolder, filename);
+        return new BufferedWriter(
+                new OutputStreamWriter(new FileOutputStream(outputFile), StandardCharsets.UTF_8));
+    }
+
+    /**
+     * Builds the {@code code-point-attributes} declaration for an enumerated property: the
+     * attribute name followed by the braced list of its permitted values.
+     *
+     * <p>When the formatted values span several lines, the closing <code>}?</code> is placed on a
+     * line of its own, right-aligned two columns past the attribute prefix; otherwise it follows
+     * the values on the same line.
+     *
+     * @param ucdProperty the property to describe
+     * @param valuesoutputtype the layout requested from {@code formatValues}
+     * @return the formatted declaration
+     * @throws IllegalStateException if the property has no value list registered here
+     */
+    private static String getFormattedAttribute(
+            UcdProperty ucdProperty, VALUESOUTPUTTYPE valuesoutputtype) {
+        final String attributePrefix = "    attribute " + ucdProperty.getShortName() + " ";
+        final List<String> propertyValues = lookupAttributeValues(ucdProperty);
+        final String body =
+                formatValues(attributePrefix.length(), propertyValues, valuesoutputtype);
+
+        final StringBuilder fragment = new StringBuilder("  code-point-attributes &amp;=");
+        fragment.append(NEWLINE).append(attributePrefix).append("{ ");
+        if (!body.contains(NEWLINE)) {
+            // Single-line value list: close the braces on the same line.
+            return fragment.append(body).append(" }?").toString();
+        }
+        final int closingWidth = attributePrefix.length() + "}?".length();
+        fragment.append(body).append(NEWLINE);
+        fragment.append(String.format("%" + closingWidth + "s", "}?"));
+        return fragment.toString();
+    }
+
+    /** Returns the value list for a property handled by {@code getFormattedAttribute}. */
+    private static List<String> lookupAttributeValues(UcdProperty ucdProperty) {
+        switch (ucdProperty) {
+            case Age:
+                return getAgeValues();
+            case Block:
+                return getBlockValues();
+            case General_Category:
+                return getGeneralCategoryValues();
+            case Canonical_Combining_Class:
+                return getCanonicalCombiningClassValues();
+            case Bidi_Class:
+                return getBidirectionalValues();
+            case Bidi_Paired_Bracket_Type:
+                return getBidiPairedBracketTypeValues();
+            case Decomposition_Type:
+                return getDecompositionTypeValues();
+            case NFC_Quick_Check:
+                return getNFCQuickCheckValues();
+            case NFD_Quick_Check:
+                return getNFDQuickCheckValues();
+            case NFKC_Quick_Check:
+                return getNFKCQuickCheckValues();
+            case NFKD_Quick_Check:
+                return getNFKDQuickCheckValues();
+            case Numeric_Type:
+                return getNumericTypeValues();
+            case Joining_Type:
+                return getJoiningTypeValues();
+            case Joining_Group:
+                return getJoiningGroupValues();
+            case Line_Break:
+                return getLineBreakValues();
+            case East_Asian_Width:
+                return getEastAsianWidthValues();
+            case Hangul_Syllable_Type:
+                return getHangulSyllableTypeValues();
+            case Indic_Syllabic_Category:
+                return getIndicSyllabicCategoryValues();
+            case Indic_Positional_Category:
+                return getIndicPositionalCategoryValues();
+            case Indic_Conjunct_Break:
+                return getIndicConjunctBreakValues();
+            case Vertical_Orientation:
+                return getVerticalOrientationValues();
+            case Grapheme_Cluster_Break:
+                return getGraphemeClusterBreakValues();
+            case Word_Break:
+                return getWordBreakValues();
+            case Sentence_Break:
+                return getSentenceBreakValues();
+            case Do_Not_Emit_Type:
+                return getDoNotEmitTypeValues();
+            default:
+                throw new IllegalStateException(
+                        ucdProperty.getShortName() + " is not handled by getFormattedAttribute.");
+        }
+    }
+
+    /**
+     * Builds the {@code code-point-attributes} declaration for a property whose values are
+     * described by a syntax (a named pattern, a literal alternative or a regular expression)
+     * rather than by an enumerated list.
+     *
+     * <p>The attribute is named after the property's short name; when the short name starts with
+     * "cjk" its first two characters are dropped. Properties without a dedicated case fall back
+     * to an {@code xsd:string} pattern built from the regular expression registered in {@code
+     * PropertyParsingInfo}.
+     *
+     * @param ucdProperty the property to describe
+     * @return the formatted declaration
+     * @throws NullPointerException if no regular expression is registered for the property; the
+     *     check runs for every property, including those whose case does not use the expression
+     */
+    private static String getFormattedSyntax(UcdProperty ucdProperty) {
+        final PropertyParsingInfo propInfo = PropertyParsingInfo.getPropertyInfo(ucdProperty);
+        if (propInfo.getRegex() == null) {
+            throw new NullPointerException(
+                    "Could not find syntax for " + ucdProperty.getShortName());
+        }
+
+        // A short name "cjkX..." becomes the attribute name "kX...".
+        String attributeString =
+                ucdProperty.getShortName().startsWith("cjk")
+                        ? "    attribute " + ucdProperty.getShortName().substring(2) + " "
+                        : "    attribute " + ucdProperty.getShortName() + " ";
+        String formattedAttributeString;
+        switch (ucdProperty) {
+                // { text }
+            case ISO_Comment:
+                formattedAttributeString = attributeString + "{ text }?";
+                break;
+
+                // { single-code-point }
+            case Equivalent_Unified_Ideograph:
+                formattedAttributeString = attributeString + "{ single-code-point }?";
+                break;
+
+                // { "" | single-code-point }
+            case Bidi_Mirroring_Glyph:
+                formattedAttributeString = attributeString + "{ \"\" | single-code-point }?";
+                break;
+
+                // { "#" | single-code-point }
+            case Bidi_Paired_Bracket:
+            case Simple_Uppercase_Mapping:
+            case Simple_Lowercase_Mapping:
+            case Simple_Titlecase_Mapping:
+            case Simple_Case_Folding:
+                formattedAttributeString = attributeString + "{ \"#\" | single-code-point }?";
+                break;
+
+                // { "#" | zero-or-more-code-points }
+            case Decomposition_Mapping:
+            case NFKC_Casefold:
+            case NFKC_Simple_Casefold:
+                formattedAttributeString =
+                        attributeString + "{ \"#\" | zero-or-more-code-points }?";
+                break;
+
+                // { "#" | one-or-more-code-points }
+            case FC_NFKC_Closure:
+            case Uppercase_Mapping:
+            case Lowercase_Mapping:
+            case Titlecase_Mapping:
+            case Case_Folding:
+                formattedAttributeString = attributeString + "{ \"#\" | one-or-more-code-points }?";
+                break;
+
+                // { "NaN" | RegEx }
+            case Numeric_Value:
+                formattedAttributeString =
+                        attributeString
+                                + "{ \"NaN\" | xsd:string { pattern=\""
+                                + cleanRegex(propInfo.getRegex().toString())
+                                + "\" } }?";
+                break;
+
+                // Special cases
+            case Name:
+                // Empty string, one of the fixed "...-#" name templates, or a string matching
+                // the registered regular expression.
+                formattedAttributeString =
+                        attributeString
+                                + "{ \"\" |"
+                                + NEWLINE
+                                + "                   \"CJK UNIFIED IDEOGRAPH-#\" |"
+                                + NEWLINE
+                                + "                   \"CJK COMPATIBILITY IDEOGRAPH-#\" |"
+                                + NEWLINE
+                                + "                   \"EGYPTIAN HIEROGLYPH-#\" |"
+                                + NEWLINE
+                                + "                   \"TANGUT IDEOGRAPH-#\" |"
+                                + NEWLINE
+                                + "                   \"KHITAN SMALL SCRIPT CHARACTER-#\" |"
+                                + NEWLINE
+                                + "                   \"NUSHU CHARACTER-#\" |"
+                                + NEWLINE
+                                + "                   xsd:string { pattern=\""
+                                + cleanRegex(propInfo.getRegex().toString())
+                                + "\" }"
+                                + NEWLINE
+                                + "                 }?";
+                break;
+            case Unicode_1_Name:
+                formattedAttributeString =
+                        attributeString
+                                + "{ \"\" | xsd:string { pattern=\""
+                                + cleanRegex(propInfo.getRegex().toString())
+                                + "\" } }?";
+                break;
+            case Script:
+                formattedAttributeString = attributeString + "{ script }?";
+                break;
+            case Script_Extensions:
+                formattedAttributeString = attributeString + "{ list { script + } }?";
+                break;
+            case kTGT_MergedSrc:
+                // Ideally, should be obtained from a TR.
+                String kTGT_MergedSrc =
+                        NEWLINE
+                                + "     { xsd:string {pattern=\"L2008-[0-9A-F]{4,5}(-[0-9]{4,5})?\"}"
+                                + NEWLINE
+                                + "     | xsd:string {pattern=\"L2006-[0-9]{4}\"}"
+                                + NEWLINE
+                                + "     | xsd:string {pattern=\"L1997-[0-9]{4}\"}"
+                                + NEWLINE
+                                + "     | xsd:string {pattern=\"L1986-[0-9]{4}\"}"
+                                + NEWLINE
+                                + "     | xsd:string {pattern=\"S1968-[0-9]{4}\"}"
+                                + NEWLINE
+                                + "     | xsd:string {pattern=\"N1966-[0-9]{3}(-[0-9A-Z]{3,4})?\"}"
+                                + NEWLINE
+                                + "     | xsd:string {pattern=\"H2004-[A-Z]-[0-9]{4}\"}"
+                                + NEWLINE
+                                + "     | xsd:string {pattern=\"L2012-[0-9]{4}\"}"
+                                + NEWLINE
+                                + "     | xsd:string {pattern=\"UTN42-[0-9]{3}\"}"
+                                + NEWLINE
+                                + "     }?";
+                formattedAttributeString = attributeString + kTGT_MergedSrc;
+                break;
+            case kReading:
+                // Ideally, should be obtained from a TR.
+                String kReading = "{ xsd:string }?";
+                formattedAttributeString = attributeString + kReading;
+                break;
+
+                // Every other property: a string constrained by its registered regular
+                // expression.
+            default:
+                formattedAttributeString =
+                        attributeString
+                                + "{ xsd:string { pattern=\""
+                                + cleanRegex(propInfo.getRegex().toString())
+                                + "\" } }?";
+        }
+        return "  code-point-attributes &amp;=" + NEWLINE + formattedAttributeString;
+    }
+
+    /**
+     * Builds the {@code code-point-attributes} declaration for a property whose syntax comes
+     * from the TR38 syntax table.
+     *
+     * <p>The attribute name is the property's short name without its first two characters.
+     *
+     * @param ucdProperty the property to describe; its {@code name()} is the lookup key in
+     *     {@code syntaxTR38}
+     * @return the formatted declaration
+     * @throws NullPointerException if the syntax table has no entry for the property
+     */
+    private static String getFormattedTR38Syntax(UcdProperty ucdProperty) {
+        // TODO: We should determine whether we still want to show empty values in the XML files.
+        // TODO: See org.unicode.xml.UcdPropertyDetail.isCJKShowIfEmpty()
+        boolean showIfEmpty = false;
+        for (UCDPropertyDetail detail : UCDPropertyDetail.cjkValues()) {
+            if (!detail.getUcdProperty().equals(ucdProperty)) {
+                continue;
+            }
+            // The scan is not cut short, so the last matching detail decides.
+            showIfEmpty = detail.isCJKShowIfEmpty();
+        }
+
+        final String attributeName = ucdProperty.getShortName().substring(2);
+        final String propertyName = ucdProperty.name();
+        final TR38Details details = syntaxTR38.get(propertyName);
+        if (details == null) {
+            throw new NullPointerException(
+                    "Could not locate details for " + propertyName + " in " + TR38URL);
+        }
+        final String syntaxBlock = formatTR38Syntax(details, showIfEmpty);
+
+        final StringBuilder fragment = new StringBuilder("  code-point-attributes &amp;=");
+        fragment.append(" attribute ").append(attributeName);
+        fragment.append(NEWLINE).append(syntaxBlock);
+        return fragment.toString();
+    }
+
+    /**
+     * Builds the declaration of the {@code name-alias} child element: an {@code alias} attribute
+     * constrained by the property's regular expression and a {@code type} attribute listing the
+     * name-alias types.
+     *
+     * @param ucdProperty the property whose regular expression constrains the alias; currently
+     *     only {@code UcdProperty.Name_Alias} is passed, and the element name and type values are
+     *     specific to it
+     * @return the formatted declaration
+     */
+    private static String getFormattedElement(UcdProperty ucdProperty) {
+        // Currently scoped to UcdProperty.Name_Alias, but might need to handle different
+        // properties.
+        final List<String> aliasTypes = getNameAliasTypeValues();
+        final PropertyParsingInfo parsingInfo = PropertyParsingInfo.getPropertyInfo(ucdProperty);
+        final String aliasPattern = cleanRegex(parsingInfo.getRegex().toString());
+
+        final String typePrefix = "      attribute type  ";
+        final String typeValues =
+                formatValues(typePrefix.length(), aliasTypes, VALUESOUTPUTTYPE.ALPHABETICAL_GROUP);
+        // The closing tokens are right-aligned just past the column where the values start.
+        final int closingWidth = typePrefix.length() + "}? } *".length();
+
+        final StringBuilder fragment = new StringBuilder();
+        fragment.append("  code-point-attributes &amp;=").append(NEWLINE);
+        fragment.append("    element ").append("name-alias").append(" {").append(NEWLINE);
+        fragment.append("      attribute alias { xsd:string { pattern=\"")
+                .append(aliasPattern)
+                .append("\" } }?,")
+                .append(NEWLINE);
+        fragment.append(typePrefix).append("{ ").append(typeValues).append(NEWLINE);
+        fragment.append(String.format("%" + closingWidth + "s", "}? } *"));
+        return fragment.toString();
+    }
+
+    /**
+     * Builds the {@code code-point-attributes} declaration for a boolean property.
+     *
+     * @param ucdProperty the property whose short name becomes the attribute name
+     * @return the formatted declaration
+     */
+    private static String getFormattedBoolean(UcdProperty ucdProperty) {
+        final StringBuilder fragment = new StringBuilder("  code-point-attributes &amp;=");
+        fragment.append(NEWLINE);
+        fragment.append("    attribute ").append(ucdProperty.getShortName()).append(" ");
+        fragment.append("{ boolean }?");
+        return fragment.toString();
+    }
+
+    /**
+     * Builds a {@code <schema name> = <values>} definition from the binary values.
+     *
+     * @param schema the schema section whose name appears on the left-hand side
+     * @param valuesoutputtype the layout requested from {@code formatValues}
+     * @return the formatted definition
+     */
+    private static String getFormattedValues(SCHEMA schema, VALUESOUTPUTTYPE valuesoutputtype) {
+        final String body = formatValues(2, getBinaryValues(), valuesoutputtype);
+        final StringBuilder definition = new StringBuilder("  ");
+        definition.append(schema.getName()).append(" = ").append(body);
+        return definition.toString();
+    }
+
+    /**
+     * Builds a {@code <lower-cased property name> = <values>} definition.
+     *
+     * <p>NOTE(review): the values always come from {@code getScriptValues()}, whatever property
+     * is passed; the property only supplies the name on the left-hand side. Confirm that this is
+     * intended.
+     *
+     * @param ucdProperty the property whose lower-cased name appears on the left-hand side
+     * @param valuesoutputtype the layout requested from {@code formatValues}
+     * @return the formatted definition
+     */
+    private static String getFormattedPropertyValues(
+            UcdProperty ucdProperty, VALUESOUTPUTTYPE valuesoutputtype) {
+        final String body = formatValues(11, getScriptValues(), valuesoutputtype);
+        final StringBuilder definition = new StringBuilder("  ");
+        definition.append(ucdProperty.name().toLowerCase()).append(" = ").append(body);
+        return definition.toString();
+    }
+
+    private static String getFormattedDoNotEmit(VALUESOUTPUTTYPE valuesoutputtype) {
+        List<String> values = getDoNotEmitTypeValues();
+        String formattedValues = formatValues(26, values, valuesoutputtype);
+        return "  ucd.content &amp;=\n"
+                + "    element do-not-emit {\n"
+                + "      element instead {\n"
+                + "        attribute of { one-or-more-code-points },\n"
+                + "        attribute use { one-or-more-code-points },\n"
+                + "        attribute because { "
+                + formattedValues
+                + NEWLINE
+                + "      } }+ }?";
+    }
+
+    /**
+     * Renders the syntax of a TR38 property as a RELAX NG Compact attribute value pattern.
+     *
+     * <p>The syntax is first passed through cleanRegex. A single-line syntax becomes one {@code
+     * xsd:string { pattern=... }}; a multi-line syntax becomes one such alternative per non-empty
+     * line. List-valued properties are wrapped in {@code list { ... }} with a {@code +}
+     * repetition, and when {@code isShowIfEmpty} is set the empty string is offered as the first
+     * alternative.
+     *
+     * @param tr38Details supplies the syntax text and whether the property is a list
+     * @param isShowIfEmpty whether {@code ""} is accepted in addition to the syntax
+     * @return the pattern text, starting with four spaces and ending with {@code }?}
+     */
+    private static String formatTR38Syntax(TR38Details tr38Details, boolean isShowIfEmpty) {
+        // TODO: We should determine whether we still want to show empty values in the XML files.
+        // TODO: See org.unicode.xml.UcdPropertyDetail.isCJKShowIfEmpty()
+        boolean isList = tr38Details.isList();
+        String syntax = cleanRegex(tr38Details.getSyntax());
+        // This is a kludge as it depends on only having single OR double quotes in the syntax. If
+        // we have both, we'll need to do more investigation on what RELAXNG Compact supports.
+        String quoteMark = syntax.contains("\"") ? "'" : "\"";
+        String emptyAlternative = isShowIfEmpty ? "\"\" | " : "";
+
+        if (!syntax.contains("\n")) {
+            String pattern = "xsd:string { pattern=" + quoteMark + syntax + quoteMark + " }";
+            String body = isList ? "list { " + pattern + "+ }" : pattern;
+            return "    { " + emptyAlternative + body + " }?";
+        }
+
+        // Multi-line syntax: the first line carries the opening text, later lines are aligned
+        // under it. For lists the ending closes a group with ")+", so the prefix must open that
+        // group with "( " whether or not the empty alternative is present.
+        String firstLinePrefix = "    { " + emptyAlternative + (isList ? "list { ( " : "");
+        String ending = isList ? "    )+}}?" : "    }?";
+        int indent;
+        if (isShowIfEmpty) {
+            indent = isList ? 17 : 8;
+        } else {
+            indent = isList ? 12 : 4;
+        }
+        String padding = String.format("%" + indent + "s", "");
+
+        StringBuilder formattedSyntaxBuilder = new StringBuilder();
+        Matcher matcher = Pattern.compile("([^\r\n]+)").matcher(syntax);
+        boolean isFirstLine = true;
+        while (matcher.find()) {
+            String line = matcher.group(1);
+            if (isFirstLine) {
+                formattedSyntaxBuilder
+                        .append(firstLinePrefix)
+                        .append("xsd:string { pattern=")
+                        .append(quoteMark)
+                        .append(line);
+                isFirstLine = false;
+            } else {
+                // Any leading "|" and spaces in the source line are replaced by the choice
+                // operator followed by the opening of a new xsd:string pattern.
+                formattedSyntaxBuilder
+                        .append(padding)
+                        .append(
+                                line.replaceAll(
+                                        "^[| ]*", " | xsd:string { pattern=" + quoteMark));
+            }
+            formattedSyntaxBuilder.append(quoteMark).append(" }").append(NEWLINE);
+        }
+        formattedSyntaxBuilder.append(ending);
+        return formattedSyntaxBuilder.toString();
+    }
+
+    private static String formatValues(
+            int indent, List<String> values, VALUESOUTPUTTYPE valuesoutputtype) {
+        StringBuilder valueBlock = new StringBuilder();
+        StringBuilder currentLine = new StringBuilder();
+        String padding = String.format("%" + indent + "s", "");
+        String groupPrefix = "";
+        for (String value : values) {
+            StringBuilder formattedValue = new StringBuilder();
+            if (valueBlock.length() > 0 || currentLine.length() > 0) {
+                formattedValue.append("| ");
+            }
+            if (value.startsWith("xsd")) {
+                formattedValue.append(value);
+            } else {
+                formattedValue.append("\"").append(value).append("\"");
+            }
+
+            switch (valuesoutputtype) {
+                case NUMERICAL_GROUP:
+                case ALPHABETICAL_GROUP:
+                    String valuePrefix = getValuePrefix(value, valuesoutputtype);
+                    if (groupPrefix.isEmpty()) {
+                        currentLine.append(formattedValue);
+                        groupPrefix = valuePrefix;
+                    } else if (valuePrefix.equals(groupPrefix)) {
+                        int testLength =
+                                valueBlock.length() == 0
+                                        ? padding.length() + currentLine.length() + " ".length()
+                                        : currentLine.length() + " ".length();
+                        if ((testLength + formattedValue.length()) > MAX_LINE_LENGTH) {
+                            valueBlock.append(currentLine).append(NEWLINE);
+                            currentLine.setLength(0);
+                            currentLine.append(padding).append(formattedValue);
+                        } else {
+                            if (currentLine.length() > 0) {
+                                currentLine.append(" ");
+                            }
+                            currentLine.append(formattedValue);
+                        }
+                    } else {
+                        valueBlock.append(currentLine).append(NEWLINE);
+                        currentLine.setLength(0);
+                        currentLine.append(padding).append(formattedValue);
+                        groupPrefix = valuePrefix;
+                    }
+                    break;
+
+                case MAX_LINE_LENGTH:
+                    int testLength =
+                            valueBlock.length() == 0
+                                    ? padding.length() + currentLine.length() + " ".length()
+                                    : currentLine.length() + " ".length();
+                    if ((testLength + formattedValue.length()) > MAX_LINE_LENGTH) {
+                        valueBlock.append(currentLine).append(NEWLINE);
+                        currentLine.setLength(0);
+                        currentLine.append(padding).append(formattedValue);
+                    } else {
+                        if (currentLine.length() > 0) {
+                            currentLine.append(" ");
+                        }
+                        currentLine.append(formattedValue);
+                    }
+                    break;
+
+                case VALUE_PER_LINE:
+                default:
+                    if (valueBlock.length() > 0) {
+                        valueBlock.append(NEWLINE).append(padding).append("| ");
+                    }
+                    if (value.startsWith("xsd")) {
+                        valueBlock.append(value);
+                    } else {
+                        valueBlock.append("\"").append(value).append("\"");
+                    }
+            }
+        }
+        valueBlock.append(currentLine);
+        return valueBlock.toString();
+    }
+
+    /**
+     * Returns the key used to decide whether two consecutive values belong to the same group.
+     *
+     * <ul>
+     *   <li>ALPHABETICAL_GROUP: the first character of the value.
+     *   <li>NUMERICAL_GROUP: the text before the first {@code .}, or the whole value when it
+     *       contains no dot (string values in a list of numbers, see Age_Values).
+     * </ul>
+     *
+     * @param value the value to classify
+     * @param valuesoutputtype the grouping strategy; must be one of the two grouping types
+     * @return the grouping key
+     * @throws IllegalArgumentException if {@code valuesoutputtype} is not a grouping type
+     */
+    private static String getValuePrefix(String value, VALUESOUTPUTTYPE valuesoutputtype) {
+        if (valuesoutputtype == VALUESOUTPUTTYPE.ALPHABETICAL_GROUP) {
+            return value.substring(0, 1);
+        }
+        if (valuesoutputtype == VALUESOUTPUTTYPE.NUMERICAL_GROUP) {
+            int dot = value.indexOf('.');
+            // String value in list of numbers. See Age_Values for an example.
+            return dot >= 0 ? value.substring(0, dot) : value;
+        }
+        throw new IllegalArgumentException(
+                "No value prefix is defined for output type " + valuesoutputtype);
+    }
+
+    private static String cleanRegex(String regex) {
+        return regex.replaceAll("\\[-", "[\\\\-").replaceAll("\\\\/", "/").replaceAll("\\\\'", "'");
+    }
+
+    // ********************* Combined properties ********************//
+
+    private static String getFormattedDecompositionProperties() {
+        return getFormattedAttribute(
+                        UcdProperty.Decomposition_Type, VALUESOUTPUTTYPE.MAX_LINE_LENGTH)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.Decomposition_Mapping);
+    }
+
+    private static String getFormattedCompositionProperties() {
+        return getFormattedBoolean(UcdProperty.Composition_Exclusion)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Full_Composition_Exclusion);
+    }
+
+    private static String getFormattedQuickCheckProperties() {
+        return getFormattedAttribute(UcdProperty.NFC_Quick_Check, VALUESOUTPUTTYPE.MAX_LINE_LENGTH)
+                + DOUBLELINE
+                + getFormattedAttribute(
+                        UcdProperty.NFD_Quick_Check, VALUESOUTPUTTYPE.MAX_LINE_LENGTH)
+                + DOUBLELINE
+                + getFormattedAttribute(
+                        UcdProperty.NFKC_Quick_Check, VALUESOUTPUTTYPE.MAX_LINE_LENGTH)
+                + DOUBLELINE
+                + getFormattedAttribute(
+                        UcdProperty.NFKD_Quick_Check, VALUESOUTPUTTYPE.MAX_LINE_LENGTH)
+                + TRIPLELINE
+                + getFormattedBoolean(UcdProperty.Expands_On_NFC)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Expands_On_NFD)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Expands_On_NFKC)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Expands_On_NFKD)
+                + TRIPLELINE
+                + getFormattedSyntax(UcdProperty.FC_NFKC_Closure);
+    }
+
+    private static String getFormattedNumericProperties() {
+        return getFormattedAttribute(UcdProperty.Numeric_Type, VALUESOUTPUTTYPE.MAX_LINE_LENGTH)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.Numeric_Value);
+    }
+
+    private static String getFormattedJoiningProperties() {
+        return getFormattedAttribute(UcdProperty.Joining_Type, VALUESOUTPUTTYPE.MAX_LINE_LENGTH)
+                + DOUBLELINE
+                + getFormattedAttribute(
+                        UcdProperty.Joining_Group, VALUESOUTPUTTYPE.ALPHABETICAL_GROUP);
+    }
+
+    private static String getFormattedCasingProperties() {
+        return getFormattedBoolean(UcdProperty.Uppercase)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Lowercase)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Other_Uppercase)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Other_Lowercase);
+    }
+
+    private static String getFormattedSimpleCaseMappingProperties() {
+        return getFormattedSyntax(UcdProperty.Simple_Uppercase_Mapping)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.Simple_Lowercase_Mapping)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.Simple_Titlecase_Mapping);
+    }
+
+    private static String getFormattedCaseMappingProperties() {
+        return getFormattedSyntax(UcdProperty.Uppercase_Mapping)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.Lowercase_Mapping)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.Titlecase_Mapping);
+    }
+
+    private static String getFormattedCaseFoldingProperties() {
+        return getFormattedSyntax(UcdProperty.Simple_Case_Folding)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.Case_Folding);
+    }
+
+    private static String getFormattedCaseOtherProperties() {
+        return getFormattedBoolean(UcdProperty.Case_Ignorable)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Cased)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Changes_When_Casefolded)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Changes_When_Casemapped)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Changes_When_Lowercased)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Changes_When_NFKC_Casefolded)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Changes_When_Titlecased)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Changes_When_Uppercased)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.NFKC_Casefold)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.NFKC_Simple_Casefold);
+    }
+
+    private static String getFormattedScriptProperties() {
+        return getFormattedPropertyValues(UcdProperty.Script, VALUESOUTPUTTYPE.ALPHABETICAL_GROUP)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.Script)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.Script_Extensions);
+    }
+
+    private static String getFormattedIdentifierProperties() {
+        return getFormattedBoolean(UcdProperty.ID_Start)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Other_ID_Start)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.XID_Start)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.ID_Continue)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Other_ID_Continue)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.XID_Continue)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.ID_Compat_Math_Start)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.ID_Compat_Math_Continue);
+    }
+
+    private static String getFormattedPatternProperties() {
+        return getFormattedBoolean(UcdProperty.Pattern_Syntax)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Pattern_White_Space);
+    }
+
+    private static String getFormattedFunctionGraphicProperties() {
+        return getFormattedBoolean(UcdProperty.Dash)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Hyphen)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Quotation_Mark)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Terminal_Punctuation)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Sentence_Terminal)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Diacritic)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Extender)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Soft_Dotted)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Alphabetic)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Other_Alphabetic)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Math)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Other_Math)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Hex_Digit)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.ASCII_Hex_Digit)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Default_Ignorable_Code_Point)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Other_Default_Ignorable_Code_Point)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Logical_Order_Exception)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Prepended_Concatenation_Mark)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Modifier_Combining_Mark)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.White_Space)
+                + DOUBLELINE
+                + getFormattedAttribute(
+                        UcdProperty.Vertical_Orientation, VALUESOUTPUTTYPE.MAX_LINE_LENGTH)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Regional_Indicator);
+    }
+
+    private static String getFormattedBoundaryProperties() {
+        return getFormattedBoolean(UcdProperty.Grapheme_Base)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Grapheme_Extend)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Other_Grapheme_Extend)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Grapheme_Link)
+                + DOUBLELINE
+                + getFormattedAttribute(
+                        UcdProperty.Grapheme_Cluster_Break, VALUESOUTPUTTYPE.ALPHABETICAL_GROUP)
+                + DOUBLELINE
+                + getFormattedAttribute(UcdProperty.Word_Break, VALUESOUTPUTTYPE.ALPHABETICAL_GROUP)
+                + DOUBLELINE
+                + getFormattedAttribute(
+                        UcdProperty.Sentence_Break, VALUESOUTPUTTYPE.ALPHABETICAL_GROUP);
+    }
+
+    private static String getFormattedIdeographProperties() {
+        return getFormattedBoolean(UcdProperty.Ideographic)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Unified_Ideograph)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.Equivalent_Unified_Ideograph)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.IDS_Binary_Operator)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.IDS_Trinary_Operator)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.IDS_Unary_Operator)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Radical);
+    }
+
+    private static String getFormattedMiscellaneousProperties() {
+        return getFormattedBoolean(UcdProperty.Deprecated)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Variation_Selector)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Noncharacter_Code_Point);
+    }
+
+    private static String getFormattedUnihanProperties() {
+        return getFormattedTR38Syntax(UcdProperty.kAccountingNumeric)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kAlternateTotalStrokes)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kBigFive)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kCangjie)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kCantonese)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kCCCII)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kCheungBauer)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kCheungBauerIndex)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kCihaiT)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kCNS1986)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kCNS1992)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kCompatibilityVariant)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kCowles)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kDaeJaweon)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kDefinition)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kEACC)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kFanqie)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kFenn)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kFennIndex)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kFourCornerCode)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kGB0)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kGB1)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kGB3)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kGB5)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kGB7)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kGB8)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kGradeLevel)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kGSR)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kHangul)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kHanYu)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kHanyuPinlu)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kHanyuPinyin)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kHDZRadBreak)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kHKGlyph)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIBMJapan)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIICore)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_GSource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_HSource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_JSource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_KPSource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_KSource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_MSource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_SSource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_TSource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_UKSource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_USource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRG_VSource)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRGDaeJaweon)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRGHanyuDaZidian)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kIRGKangXi)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kJa)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kJapanese)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kJapaneseKun)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kJapaneseOn)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kJinmeiyoKanji)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kJis0)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kJis1)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kJIS0213)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kJoyoKanji)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kKangXi)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kKarlgren)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kKorean)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kKoreanEducationHanja)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kKoreanName)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kLau)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kMainlandTelegraph)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kMandarin)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kMatthews)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kMeyerWempe)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kMojiJoho)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kMorohashi)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kNelson)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kOtherNumeric)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kPhonetic)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kPrimaryNumeric)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kPseudoGB1)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kRSAdobe_Japan1_6)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kRSUnicode)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kSBGY)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kSemanticVariant)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kSimplifiedVariant)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kSMSZD2003Index)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kSMSZD2003Readings)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kSpecializedSemanticVariant)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kSpoofingVariant)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kStrange)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kTaiwanTelegraph)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kTang)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kTGH)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kTGHZ2013)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kTotalStrokes)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kTraditionalVariant)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kUnihanCore2020)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kVietnamese)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kVietnameseNumeric)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kXerox)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kXHC1983)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kZhuang)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kZhuangNumeric)
+                + DOUBLELINE
+                + getFormattedTR38Syntax(UcdProperty.kZVariant);
+    }
+
+    private static String getFormattedTangutProperties() {
+        return getFormattedSyntax(UcdProperty.kRSTUnicode)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.kTGT_MergedSrc);
+    }
+
+    private static String getFormattedNushuProperties() {
+        return getFormattedSyntax(UcdProperty.kSrc_NushuDuben)
+                + DOUBLELINE
+                + getFormattedSyntax(UcdProperty.kReading);
+    }
+
+    private static String getFormattedEmojiProperties() {
+        return getFormattedBoolean(UcdProperty.Emoji)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Emoji_Presentation)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Emoji_Modifier)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Emoji_Modifier_Base)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Emoji_Component)
+                + DOUBLELINE
+                + getFormattedBoolean(UcdProperty.Extended_Pictographic);
+    }
+
+    // ********************* Attribute values ********************//
+
+    private static List<String> getBinaryValues() {
+        List<String> values = new ArrayList<>();
+        for (Binary binaryValues : Binary.values()) {
+            values.add(binaryValues.getShortName());
+        }
+        // Binary should display as Y | N.
+        values.sort(Collections.reverseOrder());
+        return values;
+    }
+
+    private static List<String> getAgeValues() {
+        List<String> values = new ArrayList<>();
+        for (Age_Values ageValues : Age_Values.values()) {
+            String shortName = ageValues.getShortName();
+            if (shortName.equals("NA")) {
+                values.add("unassigned");
+            } else if (shortName.equals("13.1")) {
+                // https://github.com/unicode-org/unicodetools/issues/100
+            } else {
+                values.add(shortName);
+            }
+        }
+        return values;
+    }
+
+    private static List<String> getNameAliasTypeValues() {
+        List<String> values = new ArrayList<>();
+        for (AttributeResolver.AliasType aliastypeValues : AttributeResolver.AliasType.values()) {
+            if (!aliastypeValues.equals(AttributeResolver.AliasType.NONE)) {
+                values.add(aliastypeValues.toString());
+            }
+        }
+        return values;
+    }
+
+    /** Returns the short name of every Block value, in the order given by values(). */
+    private static List<String> getBlockValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Block_Values.values())
+                .forEachOrdered(block -> shortNames.add(block.getShortName()));
+        return shortNames;
+    }
+
+    /**
+     * Lists the General_Category short names that apply to individual code points. Short names
+     * that are entirely upper case (LC, L, M, N, P, S, Z, C) stand for groupings of related
+     * General_Category values; they won't occur on any individual code point, so are skipped.
+     */
+    private static List<String> getGeneralCategoryValues() {
+        List<String> categories = new ArrayList<>();
+        for (General_Category_Values category : General_Category_Values.values()) {
+            String shortName = category.getShortName();
+            boolean isGrouping = shortName.toUpperCase().equals(shortName);
+            if (!isGrouping) {
+                categories.add(shortName);
+            }
+        }
+        return categories;
+    }
+
+    /**
+     * Returns the single schema pattern for Canonical_Combining_Class: an integer from 0 to 254.
+     *
+     * <p>Because the set of values that this property has taken across the various versions of
+     * the UCD is rather large, our schema does not restrict the possible values to those actually
+     * used, so Canonical_Combining_Class_Values is intentionally not enumerated here.
+     */
+    private static List<String> getCanonicalCombiningClassValues() {
+        List<String> pattern = new ArrayList<>();
+        pattern.add("xsd:integer { minInclusive=\"0\" maxInclusive=\"254\" }");
+        return pattern;
+    }
+
+    /** Returns the short name of every Bidi_Class value, in the order given by values(). */
+    private static List<String> getBidirectionalValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Bidi_Class_Values.values())
+                .forEachOrdered(bidiClass -> shortNames.add(bidiClass.getShortName()));
+        return shortNames;
+    }
+
+    /** Lists the Bidi_Paired_Bracket_Type short names in the order Open, Close, None. */
+    private static List<String> getBidiPairedBracketTypeValues() {
+        List<String> values = new ArrayList<>();
+        values.add(Bidi_Paired_Bracket_Type_Values.Open.getShortName());
+        values.add(Bidi_Paired_Bracket_Type_Values.Close.getShortName());
+        values.add(Bidi_Paired_Bracket_Type_Values.None.getShortName());
+        // Fail loudly, naming the culprit, if the enum has a value the fixed order does not cover.
+        for (Bidi_Paired_Bracket_Type_Values value : Bidi_Paired_Bracket_Type_Values.values()) {
+            if (!values.contains(value.getShortName())) {
+                throw new IllegalArgumentException(
+                        "Unexpected Bidi_Paired_Bracket_Type value: " + value.getShortName());
+            }
+        }
+        return values;
+    }
+
+    /** Lists the first "other name" of each Decomposition_Type value, with None moved last. */
+    private static List<String> getDecompositionTypeValues() {
+        List<String> names = new ArrayList<>();
+        for (Decomposition_Type_Values type : Decomposition_Type_Values.values()) {
+            if (type == Decomposition_Type_Values.None) {
+                continue; // Appended after the loop so that it comes last.
+            }
+            names.add(type.getNames().getOtherNames().get(0));
+        }
+        names.add(Decomposition_Type_Values.None.getNames().getOtherNames().get(0));
+        return names;
+    }
+
+    /** Lists NFC_Quick_Check short names as Yes, No, Maybe; throws if the enum has any other. */
+    private static List<String> getNFCQuickCheckValues() {
+        List<String> values = new ArrayList<>();
+        values.add(NFC_Quick_Check_Values.Yes.getShortName());
+        values.add(NFC_Quick_Check_Values.No.getShortName());
+        values.add(NFC_Quick_Check_Values.Maybe.getShortName());
+        for (NFC_Quick_Check_Values value : NFC_Quick_Check_Values.values()) {
+            if (!values.contains(value.getShortName())) {
+                throw new IllegalArgumentException(
+                        "Unexpected NFC_Quick_Check value: " + value.getShortName());
+            }
+        }
+        return values;
+    }
+
+    /** Lists NFD_Quick_Check short names as Yes, No; throws if the enum has any other value. */
+    private static List<String> getNFDQuickCheckValues() {
+        List<String> values = new ArrayList<>();
+        values.add(NFD_Quick_Check_Values.Yes.getShortName());
+        values.add(NFD_Quick_Check_Values.No.getShortName());
+        for (NFD_Quick_Check_Values value : NFD_Quick_Check_Values.values()) {
+            if (!values.contains(value.getShortName())) {
+                throw new IllegalArgumentException(
+                        "Unexpected NFD_Quick_Check value: " + value.getShortName());
+            }
+        }
+        return values;
+    }
+
+    /** Lists NFKC_Quick_Check short names as Yes, No, Maybe; throws if the enum has any other. */
+    private static List<String> getNFKCQuickCheckValues() {
+        List<String> values = new ArrayList<>();
+        values.add(NFKC_Quick_Check_Values.Yes.getShortName());
+        values.add(NFKC_Quick_Check_Values.No.getShortName());
+        values.add(NFKC_Quick_Check_Values.Maybe.getShortName());
+        for (NFKC_Quick_Check_Values value : NFKC_Quick_Check_Values.values()) {
+            if (!values.contains(value.getShortName())) {
+                throw new IllegalArgumentException(
+                        "Unexpected NFKC_Quick_Check value: " + value.getShortName());
+            }
+        }
+        return values;
+    }
+
+    /** Lists NFKD_Quick_Check short names as Yes, No; throws if the enum has any other value. */
+    private static List<String> getNFKDQuickCheckValues() {
+        List<String> values = new ArrayList<>();
+        values.add(NFKD_Quick_Check_Values.Yes.getShortName());
+        values.add(NFKD_Quick_Check_Values.No.getShortName());
+        for (NFKD_Quick_Check_Values value : NFKD_Quick_Check_Values.values()) {
+            if (!values.contains(value.getShortName())) {
+                throw new IllegalArgumentException(
+                        "Unexpected NFKD_Quick_Check value: " + value.getShortName());
+            }
+        }
+        return values;
+    }
+
+    /** Lists Numeric_Type short names as Decimal, Digit, Numeric, None; throws on any other. */
+    private static List<String> getNumericTypeValues() {
+        List<String> values = new ArrayList<>();
+        values.add(Numeric_Type_Values.Decimal.getShortName());
+        values.add(Numeric_Type_Values.Digit.getShortName());
+        values.add(Numeric_Type_Values.Numeric.getShortName());
+        values.add(Numeric_Type_Values.None.getShortName());
+        for (Numeric_Type_Values value : Numeric_Type_Values.values()) {
+            if (!values.contains(value.getShortName())) {
+                throw new IllegalArgumentException(
+                        "Unexpected Numeric_Type value: " + value.getShortName());
+            }
+        }
+        return values;
+    }
+
+    /** Returns the short name of every Joining_Type value, in the order given by values(). */
+    private static List<String> getJoiningTypeValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Joining_Type_Values.values())
+                .forEachOrdered(joiningType -> shortNames.add(joiningType.getShortName()));
+        return shortNames;
+    }
+
+    /** Returns the short name of every Joining_Group value, in the order given by values(). */
+    private static List<String> getJoiningGroupValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Joining_Group_Values.values())
+                .forEachOrdered(joiningGroup -> shortNames.add(joiningGroup.getShortName()));
+        return shortNames;
+    }
+
+    /** Returns the short name of every Line_Break value, in the order given by values(). */
+    private static List<String> getLineBreakValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Line_Break_Values.values())
+                .forEachOrdered(lineBreak -> shortNames.add(lineBreak.getShortName()));
+        return shortNames;
+    }
+
+    /** Returns the short name of every East_Asian_Width value, in the order of values(). */
+    private static List<String> getEastAsianWidthValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(East_Asian_Width_Values.values())
+                .forEachOrdered(width -> shortNames.add(width.getShortName()));
+        return shortNames;
+    }
+
+    /**
+     * Lists the Script short names in sorted order, omitting the values in the exclusion list.
+     * Only short names are emitted; a value's other names (getNames().getOtherNames()) are not
+     * included.
+     */
+    private static List<String> getScriptValues() {
+        List<Script_Values> excluded =
+                Arrays.asList(
+                        Script_Values.Han_with_Bopomofo,
+                        Script_Values.Japanese,
+                        Script_Values.Korean,
+                        Script_Values.Math_Symbols,
+                        Script_Values.Emoji_Symbols,
+                        Script_Values.Other_Symbols,
+                        Script_Values.Unwritten);
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Script_Values.values())
+                .filter(script -> !excluded.contains(script))
+                .map(script -> script.getShortName())
+                .forEachOrdered(shortNames::add);
+        Collections.sort(shortNames);
+        return shortNames;
+    }
+
+    /** Returns the short name of every Hangul_Syllable_Type value, in values() order. */
+    private static List<String> getHangulSyllableTypeValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Hangul_Syllable_Type_Values.values())
+                .map(syllableType -> syllableType.getShortName())
+                .forEachOrdered(shortNames::add);
+        return shortNames;
+    }
+
+    /** Returns the short name of every Indic_Syllabic_Category value, in values() order. */
+    private static List<String> getIndicSyllabicCategoryValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Indic_Syllabic_Category_Values.values())
+                .map(category -> category.getShortName())
+                .forEachOrdered(shortNames::add);
+        return shortNames;
+    }
+
+    /** Returns the short name of every Indic_Positional_Category value, in values() order. */
+    private static List<String> getIndicPositionalCategoryValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Indic_Positional_Category_Values.values())
+                .map(category -> category.getShortName())
+                .forEachOrdered(shortNames::add);
+        return shortNames;
+    }
+
+    /** Returns the short name of every Indic_Conjunct_Break value, in values() order. */
+    private static List<String> getIndicConjunctBreakValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Indic_Conjunct_Break_Values.values())
+                .map(conjunctBreak -> conjunctBreak.getShortName())
+                .forEachOrdered(shortNames::add);
+        return shortNames;
+    }
+
+    /** Returns the short name of every Vertical_Orientation value, in values() order. */
+    private static List<String> getVerticalOrientationValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Vertical_Orientation_Values.values())
+                .map(orientation -> orientation.getShortName())
+                .forEachOrdered(shortNames::add);
+        return shortNames;
+    }
+
+    /** Returns the short name of every Grapheme_Cluster_Break value, in values() order. */
+    private static List<String> getGraphemeClusterBreakValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Grapheme_Cluster_Break_Values.values())
+                .map(clusterBreak -> clusterBreak.getShortName())
+                .forEachOrdered(shortNames::add);
+        return shortNames;
+    }
+
+    /** Returns the short name of every Word_Break value, in the order given by values(). */
+    private static List<String> getWordBreakValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Word_Break_Values.values())
+                .forEachOrdered(wordBreak -> shortNames.add(wordBreak.getShortName()));
+        return shortNames;
+    }
+
+    /** Returns the short name of every Sentence_Break value, in the order of values(). */
+    private static List<String> getSentenceBreakValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Sentence_Break_Values.values())
+                .forEachOrdered(sentenceBreak -> shortNames.add(sentenceBreak.getShortName()));
+        return shortNames;
+    }
+
+    /** Returns the Do_Not_Emit_Type short names, sorted in natural String order. */
+    private static List<String> getDoNotEmitTypeValues() {
+        List<String> shortNames = new ArrayList<>();
+        Arrays.stream(Do_Not_Emit_Type_Values.values())
+                .forEachOrdered(type -> shortNames.add(type.getShortName()));
+        Collections.sort(shortNames);
+        return shortNames;
+    }
+
+    // ********************* Utility methods ********************//
+
+    /**
+     * Downloads TR38URL as UTF-8 and maps each property in it to its Delimiter/Syntax details.
+     *
+     * @throws IllegalArgumentException if a Delimiter is neither "space" nor "N/A"
+     */
+    private static HashMap<String, TR38Details> parseTR38() throws IOException, URISyntaxException {
+        HashMap<String, TR38Details> syntaxTR38 = new HashMap<>();
+        StringBuilder html = new StringBuilder();
+        try (java.io.Reader reader =
+                new java.io.InputStreamReader(
+                        new URI(TR38URL).toURL().openStream(),
+                        java.nio.charset.StandardCharsets.UTF_8)) {
+            char[] buffer = new char[8192];
+            for (int n = reader.read(buffer); n != -1; n = reader.read(buffer)) {
+                html.append(buffer, 0, n);
+            }
+        }
+        Pattern syntaxPattern =
+                Pattern.compile(
+                        ">Property</td>.*?<strong>(.*?)</strong>.*?>Delimiter</td>.*?>(.*?)</td>.*?>Syntax</td>.*?>(.*?)</td>",
+                        Pattern.DOTALL);
+        Matcher matcher = syntaxPattern.matcher(html);
+        while (matcher.find()) {
+            String delimiter = matcher.group(2).trim();
+            if (!delimiter.equals("space") && !delimiter.equals("N/A")) {
+                throw new IllegalArgumentException(
+                        "Only \"space\" or \"N/A\" are supported values for Delimiter. Found: "
+                                + delimiter);
+            }
+            boolean isList = delimiter.equals("space");
+            syntaxTR38.put(
+                    matcher.group(1).trim(),
+                    new TR38Details(isList, matcher.group(3).trim().replace("<br>", "")));
+        }
+        return syntaxTR38;
+    }
+}
diff --git a/unicodetools/src/main/java/org/unicode/xml/UCDDataResolver.java b/unicodetools/src/main/java/org/unicode/xml/UCDDataResolver.java
new file mode 100644
index 000000000..d607a661f
--- /dev/null
+++ b/unicodetools/src/main/java/org/unicode/xml/UCDDataResolver.java
@@ -0,0 +1,235 @@
+package org.unicode.xml;
+
+import com.ibm.icu.util.VersionInfo;
+import java.util.ArrayList;
+import java.util.Collections;
+import java.util.HashMap;
+import java.util.List;
+import org.unicode.cldr.draft.FileUtilities;
+import org.unicode.props.IndexUnicodeProperties;
+import org.unicode.props.PropertyParsingInfo;
+import org.unicode.props.UcdLineParser;
+import org.xml.sax.SAXException;
+import org.xml.sax.helpers.AttributesImpl;
+
+/** Helper class for building sections of UCDXML files based on IndexUnicodeProperties values. */
+public class UCDDataResolver {
+
+    private final IndexUnicodeProperties indexUnicodeProperties;
+    private final String namespace;
+    private final UCDXMLWriter writer;
+
+    /**
+     * Creates a resolver bound to one set of properties, one namespace and one writer.
+     *
+     * @param iup supplies the UCD version used to pick data files and to filter by version
+     * @param namespace namespace URI set on every attribute this class creates
+     * @param writer receives the generated elements
+     */
+    public UCDDataResolver(IndexUnicodeProperties iup, String namespace, UCDXMLWriter writer) {
+        indexUnicodeProperties = iup;
+        this.namespace = namespace;
+        this.writer = writer;
+    }
+
+    /**
+     * Writes the element for {@code ucdSection} with one empty child element per data line of
+     * each of its component files. Nothing is written if the section's version range excludes
+     * the current UCD version; components are filtered by their own version range as well.
+     *
+     * @param ucdSection the section to emit
+     * @throws SAXException if the writer reports an error
+     */
+    public void buildSection(UCDSectionDetail.UcdSection ucdSection) throws SAXException {
+        if (!isCompatibleVersion(ucdSection.getMinVersion(), ucdSection.getMaxVersion())) {
+            return;
+        }
+        String tag = ucdSection.toString();
+        String childTag = ucdSection.getChildTag();
+
+        writer.startElement(tag);
+        for (UCDSectionComponent component :
+                ucdSection.getUcdSectionDetail().getUcdSectionComponents()) {
+            if (!isCompatibleVersion(component.getMinVersion(), component.getMaxVersion())) {
+                continue;
+            }
+            UcdLineParser parser = openParser(ucdSection, component);
+            switch (ucdSection) {
+                case BLOCKS:
+                    for (UcdLineParser.UcdLine line : parser) {
+                        // Lines whose original text starts with '#' are skipped.
+                        if (!line.getOriginalLine().startsWith("#")) {
+                            writeEmptyElement(childTag, getBlockAttributes(namespace, line));
+                        }
+                    }
+                    break;
+                case NAMEDSEQUENCES:
+                case PROVISIONALNAMEDSEQUENCES:
+                    writeNamedSequences(childTag, parser);
+                    break;
+                default:
+                    for (UcdLineParser.UcdLine line : parser) {
+                        writeEmptyElement(childTag, getAttributes(ucdSection, namespace, line));
+                    }
+            }
+        }
+        writer.endElement(tag);
+    }
+
+    /** Creates a parser over the component's data file, configured with the section's flags. */
+    private UcdLineParser openParser(
+            UCDSectionDetail.UcdSection ucdSection, UCDSectionComponent component) {
+        PropertyParsingInfo fileInfo =
+                PropertyParsingInfo.getPropertyInfo(component.getUcdProperty());
+        String fullFilename = fileInfo.getFullFileName(indexUnicodeProperties.getUcdVersion());
+        UcdLineParser parser = new UcdLineParser(FileUtilities.in("", fullFilename));
+        parser.withRange(ucdSection.getParserWithRange());
+        parser.withMissing(ucdSection.getParserWithMissing());
+        return parser;
+    }
+
+    /** Writes a child element that carries only attributes and has no content. */
+    private void writeEmptyElement(String childTag, AttributesImpl attributes)
+            throws SAXException {
+        writer.startElement(childTag, attributes);
+        writer.endElement(childTag);
+    }
+
+    /**
+     * Writes one child element per named sequence, ordered by sequence name. If a name appears
+     * on more than one line, the value from the last such line is used.
+     */
+    private void writeNamedSequences(String childTag, UcdLineParser parser) throws SAXException {
+        HashMap<String, String> namedSequences = new HashMap<>();
+        for (UcdLineParser.UcdLine line : parser) {
+            String[] parts = line.getParts();
+            namedSequences.put(parts[0], parts[1]);
+        }
+        List<String> names = new ArrayList<>(namedSequences.keySet());
+        Collections.sort(names);
+        for (String name : names) {
+            writeEmptyElement(
+                    childTag, getNamedSequenceAttributes(namespace, name, namedSequences));
+        }
+    }
+
+    /**
+     * Dispatches to the attribute builder for sections that map one data line to one element.
+     *
+     * @throws IllegalArgumentException if {@code ucdSection} has no per-line attribute builder
+     */
+    private AttributesImpl getAttributes(
+            UCDSectionDetail.UcdSection ucdSection, String namespace, UcdLineParser.UcdLine line) {
+        switch (ucdSection) {
+            case CJKRADICALS:
+                return getCJKRadicalAttributes(namespace, line);
+            case DONOTEMIT:
+                return getDoNotEmitAttributes(namespace, line);
+            case EMOJISOURCES:
+                return getEmojiSourceAttributes(namespace, line);
+            case NORMALIZATIONCORRECTIONS:
+                return getNCAttributes(namespace, line);
+            case STANDARDIZEDVARIANTS:
+                return getSVAttributes(namespace, line);
+            default:
+                throw new IllegalArgumentException(
+                        "getAttributes failed on an unexpected UcdSection: " + ucdSection);
+        }
+    }
+
+    /** Adds a CDATA attribute whose local name and qualified name are both {@code name}. */
+    private static void addCdata(
+            AttributesImpl attributes, String namespace, String name, String value) {
+        attributes.addAttribute(namespace, name, name, "CDATA", value);
+    }
+
+    /** Blocks: field 0 is split on ".." into first-cp and last-cp; field 1 becomes name. */
+    private static AttributesImpl getBlockAttributes(String namespace, UcdLineParser.UcdLine line) {
+        String[] parts = line.getParts();
+        String[] range = parts[0].split("\\.\\.");
+        AttributesImpl attributes = new AttributesImpl();
+        addCdata(attributes, namespace, "first-cp", range[0]);
+        addCdata(attributes, namespace, "last-cp", range[1]);
+        addCdata(attributes, namespace, "name", parts[1]);
+        return attributes;
+    }
+
+    /** CJK radicals: fields 0-2 become the number, radical and ideograph attributes. */
+    private static AttributesImpl getCJKRadicalAttributes(
+            String namespace, UcdLineParser.UcdLine line) {
+        String[] parts = line.getParts();
+        AttributesImpl attributes = new AttributesImpl();
+        addCdata(attributes, namespace, "number", parts[0]);
+        addCdata(attributes, namespace, "radical", parts[1]);
+        addCdata(attributes, namespace, "ideograph", parts[2]);
+        return attributes;
+    }
+
+    /** Do-not-emit: fields 0-2 become the of, use and because attributes. */
+    private static AttributesImpl getDoNotEmitAttributes(
+            String namespace, UcdLineParser.UcdLine line) {
+        String[] parts = line.getParts();
+        AttributesImpl attributes = new AttributesImpl();
+        addCdata(attributes, namespace, "of", parts[0]);
+        addCdata(attributes, namespace, "use", parts[1]);
+        addCdata(attributes, namespace, "because", parts[2]);
+        return attributes;
+    }
+
+    /** Emoji sources: fields 0-3 become the unicode, docomo, kddi and softbank attributes. */
+    private static AttributesImpl getEmojiSourceAttributes(
+            String namespace, UcdLineParser.UcdLine line) {
+        String[] parts = line.getParts();
+        AttributesImpl attributes = new AttributesImpl();
+        addCdata(attributes, namespace, "unicode", parts[0]);
+        addCdata(attributes, namespace, "docomo", parts[1]);
+        addCdata(attributes, namespace, "kddi", parts[2]);
+        addCdata(attributes, namespace, "softbank", parts[3]);
+        return attributes;
+    }
+
+    /** Named sequences: name, plus the value mapped to it in {@code namedSequences} as cps. */
+    private static AttributesImpl getNamedSequenceAttributes(
+            String namespace, String name, HashMap<String, String> namedSequences) {
+        AttributesImpl attributes = new AttributesImpl();
+        addCdata(attributes, namespace, "name", name);
+        addCdata(attributes, namespace, "cps", namedSequences.get(name));
+        return attributes;
+    }
+
+    /** Normalization corrections: fields 0-3 become the cp, old, new and version attributes. */
+    private static AttributesImpl getNCAttributes(String namespace, UcdLineParser.UcdLine line) {
+        String[] parts = line.getParts();
+        AttributesImpl attributes = new AttributesImpl();
+        addCdata(attributes, namespace, "cp", parts[0]);
+        addCdata(attributes, namespace, "old", parts[1]);
+        addCdata(attributes, namespace, "new", parts[2]);
+        addCdata(attributes, namespace, "version", parts[3]);
+        return attributes;
+    }
+
+    /**
+     * Standardized variants: fields 0-1 become cps and desc; field 2 becomes when, written as an
+     * empty string if the line has no such field or the field is null.
+     */
+    private static AttributesImpl getSVAttributes(String namespace, UcdLineParser.UcdLine line) {
+        String[] parts = line.getParts();
+        // Guard the length as well as null so a line without a third field cannot overrun parts.
+        String when = parts.length > 2 && parts[2] != null ? parts[2] : "";
+        AttributesImpl attributes = new AttributesImpl();
+        addCdata(attributes, namespace, "cps", parts[0]);
+        addCdata(attributes, namespace, "desc", parts[1]);
+        addCdata(attributes, namespace, "when", when);
+        return attributes;
+    }
+
+    /**
+     * Returns whether the current UCD version is at least {@code minVersion} and, when
+     * {@code maxVersion} is non-null, at most {@code maxVersion}.
+     */
+    private boolean isCompatibleVersion(VersionInfo minVersion, VersionInfo maxVersion) {
+        return indexUnicodeProperties.getUcdVersion().compareTo(minVersion) >= 0
+                && (maxVersion == null
+                        || indexUnicodeProperties.getUcdVersion().compareTo(maxVersion) <= 0);
+    }
+}
diff --git a/unicodetools/src/main/java/org/unicode/xml/UCDPropertyDetail.java b/unicodetools/src/main/java/org/unicode/xml/UCDPropertyDetail.java
new file mode 100644
index 000000000..9dab8117b
--- /dev/null
+++ b/unicodetools/src/main/java/org/unicode/xml/UCDPropertyDetail.java
@@ -0,0 +1,2360 @@
+package org.unicode.xml;
+
+import com.ibm.icu.util.VersionInfo;
+import java.util.LinkedHashSet;
+import java.util.Set;
+import org.unicode.props.UcdProperty;
+
+/**
+ * Helper class for determining how and when UCD properties should be shown in UCDXML. Also includes
+ * information about when a UCDProperty was added to Unicode.
+ */
+public class UCDPropertyDetail {
+
+    private static LinkedHashSet<UCDPropertyDetail> basePropertyDetails =
+            new LinkedHashSet<UCDPropertyDetail>();
+    private static LinkedHashSet<UCDPropertyDetail> cjkPropertyDetails =
+            new LinkedHashSet<UCDPropertyDetail>();
+    private static LinkedHashSet<UCDPropertyDetail> ucdxmlPropertyDetails =
+            new LinkedHashSet<UCDPropertyDetail>();
+    private static LinkedHashSet<UCDPropertyDetail> allPropertyDetails =
+            new LinkedHashSet<UCDPropertyDetail>();
+
+    public static UCDPropertyDetail Age_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Age, VersionInfo.getInstance(3, 2, 0), 1, true, false, false, true);
+    public static UCDPropertyDetail Name_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Name,
+                    VersionInfo.getInstance(1, 1, 0),
+                    2,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Jamo_Short_Name_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Jamo_Short_Name,
+                    VersionInfo.getInstance(5, 1, 0),
+                    3,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail General_Category_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.General_Category,
+                    VersionInfo.getInstance(1, 1, 0),
+                    4,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Canonical_Combining_Class_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Canonical_Combining_Class,
+                    VersionInfo.getInstance(1, 1, 0),
+                    5,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Decomposition_Type_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Decomposition_Type,
+                    VersionInfo.getInstance(1, 1, 0),
+                    6,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Decomposition_Mapping_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Decomposition_Mapping,
+                    VersionInfo.getInstance(1, 1, 0),
+                    7,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Numeric_Type_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Numeric_Type,
+                    VersionInfo.getInstance(1, 1, 0),
+                    8,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Numeric_Value_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Numeric_Value,
+                    VersionInfo.getInstance(1, 1, 0),
+                    9,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Bidi_Class_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Bidi_Class,
+                    VersionInfo.getInstance(1, 1, 0),
+                    10,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Bidi_Paired_Bracket_Type_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Bidi_Paired_Bracket_Type,
+                    VersionInfo.getInstance(6, 3, 0),
+                    11,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Bidi_Paired_Bracket_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Bidi_Paired_Bracket,
+                    VersionInfo.getInstance(6, 3, 0),
+                    12,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Bidi_Mirrored_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Bidi_Mirrored,
+                    VersionInfo.getInstance(1, 1, 0),
+                    13,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Bidi_Mirroring_Glyph_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Bidi_Mirroring_Glyph,
+                    VersionInfo.getInstance(3, 0, 1),
+                    14,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Case mappings (integer arguments 15-20). The three Simple_* mappings pass version 1.1.0;
+    // the three full mappings pass version 2.1.8. All six use the flags (true, false, false, true).
+    public static UCDPropertyDetail Simple_Uppercase_Mapping_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Simple_Uppercase_Mapping,
+                    VersionInfo.getInstance(1, 1, 0),
+                    15,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Simple_Lowercase_Mapping_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Simple_Lowercase_Mapping,
+                    VersionInfo.getInstance(1, 1, 0),
+                    16,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Simple_Titlecase_Mapping_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Simple_Titlecase_Mapping,
+                    VersionInfo.getInstance(1, 1, 0),
+                    17,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Uppercase_Mapping_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Uppercase_Mapping,
+                    VersionInfo.getInstance(2, 1, 8),
+                    18,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Lowercase_Mapping_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Lowercase_Mapping,
+                    VersionInfo.getInstance(2, 1, 8),
+                    19,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Titlecase_Mapping_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Titlecase_Mapping,
+                    VersionInfo.getInstance(2, 1, 8),
+                    20,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Disabled (commented-out) entry; the declarations on either side skip integer 21.
+    //     public static UCDPropertyDetail Special_Case_Condition_Detail =
+    //             new UCDPropertyDetail(
+    //                     UcdProperty.Special_Case_Condition,
+    //                     VersionInfo.getInstance(1, 1, 0),
+    //                     21, true, false, false, true);
+    // Case folding (integer arguments 22-23), both with version 3.0.1 and the flags
+    // (true, false, false, true).
+    public static UCDPropertyDetail Simple_Case_Folding_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Simple_Case_Folding,
+                    VersionInfo.getInstance(3, 0, 1),
+                    22,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Case_Folding_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Case_Folding,
+                    VersionInfo.getInstance(3, 0, 1),
+                    23,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Joining, East_Asian_Width, Line_Break and script properties (integer arguments 24-29).
+    // All six use the flags (true, false, false, true).
+    public static UCDPropertyDetail Joining_Type_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Joining_Type,
+                    VersionInfo.getInstance(2, 0, 0),
+                    24,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Joining_Group_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Joining_Group,
+                    VersionInfo.getInstance(2, 0, 0),
+                    25,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail East_Asian_Width_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.East_Asian_Width,
+                    VersionInfo.getInstance(3, 0, 0),
+                    26,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Line_Break_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Line_Break,
+                    VersionInfo.getInstance(3, 0, 0),
+                    27,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Script_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Script,
+                    VersionInfo.getInstance(3, 1, 0),
+                    28,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Script_Extensions_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Script_Extensions,
+                    VersionInfo.getInstance(6, 1, 0),
+                    29,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Dash, White_Space, Hyphen and Quotation_Mark (integer arguments 30-33), all with version
+    // 2.0.0 and the flags (true, false, false, true).
+    public static UCDPropertyDetail Dash_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Dash,
+                    VersionInfo.getInstance(2, 0, 0),
+                    30,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail White_Space_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.White_Space,
+                    VersionInfo.getInstance(2, 0, 0),
+                    31,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Hyphen_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Hyphen,
+                    VersionInfo.getInstance(2, 0, 0),
+                    32,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Quotation_Mark_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Quotation_Mark,
+                    VersionInfo.getInstance(2, 0, 0),
+                    33,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Radical, ideograph and IDS operator properties, followed by Hangul_Syllable_Type
+    // (integer arguments 34-39). All six use the flags (true, false, false, true).
+    public static UCDPropertyDetail Radical_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Radical,
+                    VersionInfo.getInstance(3, 2, 0),
+                    34,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Ideographic_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Ideographic,
+                    VersionInfo.getInstance(2, 0, 0),
+                    35,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Unified_Ideograph_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Unified_Ideograph,
+                    VersionInfo.getInstance(3, 2, 0),
+                    36,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail IDS_Binary_Operator_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.IDS_Binary_Operator,
+                    VersionInfo.getInstance(3, 2, 0),
+                    37,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail IDS_Trinary_Operator_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.IDS_Trinary_Operator,
+                    VersionInfo.getInstance(3, 2, 0),
+                    38,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Hangul_Syllable_Type_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Hangul_Syllable_Type,
+                    VersionInfo.getInstance(4, 0, 0),
+                    39,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Default_Ignorable_Code_Point and Other_Default_Ignorable_Code_Point (integer arguments
+    // 40-41), both with version 3.2.0 and the flags (true, false, false, true).
+    public static UCDPropertyDetail Default_Ignorable_Code_Point_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Default_Ignorable_Code_Point,
+                    VersionInfo.getInstance(3, 2, 0),
+                    40,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Other_Default_Ignorable_Code_Point_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Other_Default_Ignorable_Code_Point,
+                    VersionInfo.getInstance(3, 2, 0),
+                    41,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Alphabetic, Uppercase, Lowercase and Math, each immediately followed by its Other_*
+    // counterpart (integer arguments 42-49). All eight use the flags (true, false, false, true).
+    public static UCDPropertyDetail Alphabetic_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Alphabetic,
+                    VersionInfo.getInstance(1, 1, 0),
+                    42,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Other_Alphabetic_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Other_Alphabetic,
+                    VersionInfo.getInstance(3, 1, 0),
+                    43,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Uppercase_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Uppercase,
+                    VersionInfo.getInstance(3, 1, 0),
+                    44,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Other_Uppercase_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Other_Uppercase,
+                    VersionInfo.getInstance(3, 1, 0),
+                    45,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Lowercase_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Lowercase,
+                    VersionInfo.getInstance(3, 1, 0),
+                    46,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Other_Lowercase_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Other_Lowercase,
+                    VersionInfo.getInstance(3, 1, 0),
+                    47,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Math_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Math,
+                    VersionInfo.getInstance(2, 0, 0),
+                    48,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Other_Math_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Other_Math,
+                    VersionInfo.getInstance(3, 1, 0),
+                    49,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Hex digits, noncharacters, variation selectors and the Bidi_Control / Join_Control
+    // properties (integer arguments 50-55). All six use the flags (true, false, false, true).
+    public static UCDPropertyDetail Hex_Digit_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Hex_Digit,
+                    VersionInfo.getInstance(2, 0, 0),
+                    50,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail ASCII_Hex_Digit_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.ASCII_Hex_Digit,
+                    VersionInfo.getInstance(3, 1, 1),
+                    51,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Noncharacter_Code_Point_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Noncharacter_Code_Point,
+                    VersionInfo.getInstance(3, 0, 1),
+                    52,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Variation_Selector_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Variation_Selector,
+                    VersionInfo.getInstance(4, 0, 1),
+                    53,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Bidi_Control_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Bidi_Control,
+                    VersionInfo.getInstance(2, 0, 0),
+                    54,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Join_Control_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Join_Control,
+                    VersionInfo.getInstance(2, 0, 0),
+                    55,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Grapheme_* properties followed by Sentence_Terminal, Extender, Terminal_Punctuation,
+    // Diacritic and Deprecated (integer arguments 56-64). All nine use the flags
+    // (true, false, false, true).
+    public static UCDPropertyDetail Grapheme_Base_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Grapheme_Base,
+                    VersionInfo.getInstance(3, 2, 0),
+                    56,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Grapheme_Extend_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Grapheme_Extend,
+                    VersionInfo.getInstance(3, 2, 0),
+                    57,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Other_Grapheme_Extend_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Other_Grapheme_Extend,
+                    VersionInfo.getInstance(3, 2, 0),
+                    58,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Grapheme_Link_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Grapheme_Link,
+                    VersionInfo.getInstance(3, 2, 0),
+                    59,
+                    true,
+                    false,
+                    false,
+                    true);
+    // NOTE(review): 9.0.0 is far later than the versions passed by the neighbouring entries
+    // (2.0.0 - 3.2.0); confirm this is the intended version for Sentence_Terminal.
+    public static UCDPropertyDetail Sentence_Terminal_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Sentence_Terminal,
+                    VersionInfo.getInstance(9, 0, 0),
+                    60,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Extender_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Extender,
+                    VersionInfo.getInstance(2, 0, 0),
+                    61,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Terminal_Punctuation_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Terminal_Punctuation,
+                    VersionInfo.getInstance(2, 0, 0),
+                    62,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Diacritic_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Diacritic,
+                    VersionInfo.getInstance(2, 0, 0),
+                    63,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Deprecated_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Deprecated,
+                    VersionInfo.getInstance(3, 2, 0),
+                    64,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Identifier properties: ID_Start and ID_Continue, each followed by its Other_* and XID_*
+    // variants (integer arguments 65-70). All six use the flags (true, false, false, true).
+    public static UCDPropertyDetail ID_Start_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.ID_Start,
+                    VersionInfo.getInstance(3, 1, 0),
+                    65,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Other_ID_Start_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Other_ID_Start,
+                    VersionInfo.getInstance(4, 0, 0),
+                    66,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail XID_Start_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.XID_Start,
+                    VersionInfo.getInstance(3, 1, 0),
+                    67,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail ID_Continue_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.ID_Continue,
+                    VersionInfo.getInstance(3, 1, 0),
+                    68,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Other_ID_Continue_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Other_ID_Continue,
+                    VersionInfo.getInstance(4, 1, 0),
+                    69,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail XID_Continue_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.XID_Continue,
+                    VersionInfo.getInstance(3, 1, 0),
+                    70,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Soft_Dotted, Logical_Order_Exception and the two Pattern_* properties (integer arguments
+    // 71-74). All four use the flags (true, false, false, true).
+    public static UCDPropertyDetail Soft_Dotted_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Soft_Dotted,
+                    VersionInfo.getInstance(3, 2, 0),
+                    71,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Logical_Order_Exception_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Logical_Order_Exception,
+                    VersionInfo.getInstance(3, 2, 0),
+                    72,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Pattern_White_Space_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Pattern_White_Space,
+                    VersionInfo.getInstance(4, 1, 0),
+                    73,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Pattern_Syntax_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Pattern_Syntax,
+                    VersionInfo.getInstance(4, 1, 0),
+                    74,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Segmentation properties: Grapheme_Cluster_Break, Word_Break and Sentence_Break (integer
+    // arguments 75-77), all with version 4.1.0 and the flags (true, false, false, true).
+    public static UCDPropertyDetail Grapheme_Cluster_Break_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Grapheme_Cluster_Break,
+                    VersionInfo.getInstance(4, 1, 0),
+                    75,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Word_Break_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Word_Break,
+                    VersionInfo.getInstance(4, 1, 0),
+                    76,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Sentence_Break_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Sentence_Break,
+                    VersionInfo.getInstance(4, 1, 0),
+                    77,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Normalization-related properties: composition exclusions, the four *_Quick_Check
+    // properties, the four Expands_On_* properties and FC_NFKC_Closure (integer arguments 78-88).
+    // All eleven use the flags (true, false, false, true).
+    public static UCDPropertyDetail Composition_Exclusion_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Composition_Exclusion,
+                    VersionInfo.getInstance(3, 0, 0),
+                    78,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Full_Composition_Exclusion_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Full_Composition_Exclusion,
+                    VersionInfo.getInstance(3, 1, 0),
+                    79,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail NFC_Quick_Check_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.NFC_Quick_Check,
+                    VersionInfo.getInstance(3, 2, 0),
+                    80,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail NFD_Quick_Check_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.NFD_Quick_Check,
+                    VersionInfo.getInstance(3, 2, 0),
+                    81,
+                    true,
+                    false,
+                    false,
+                    true);
+    // NOTE(review): the other three *_Quick_Check entries pass 3.2.0; confirm that 5.2.0 is
+    // intended here and not a typo.
+    public static UCDPropertyDetail NFKC_Quick_Check_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.NFKC_Quick_Check,
+                    VersionInfo.getInstance(5, 2, 0),
+                    82,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail NFKD_Quick_Check_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.NFKD_Quick_Check,
+                    VersionInfo.getInstance(3, 2, 0),
+                    83,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Expands_On_NFC_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Expands_On_NFC,
+                    VersionInfo.getInstance(3, 2, 0),
+                    84,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Expands_On_NFD_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Expands_On_NFD,
+                    VersionInfo.getInstance(3, 2, 0),
+                    85,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Expands_On_NFKC_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Expands_On_NFKC,
+                    VersionInfo.getInstance(3, 2, 0),
+                    86,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Expands_On_NFKD_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Expands_On_NFKD,
+                    VersionInfo.getInstance(3, 2, 0),
+                    87,
+                    true,
+                    false,
+                    false,
+                    true);
+    // NOTE(review): the field is named FC_NFC_Closure_Detail but wraps
+    // UcdProperty.FC_NFKC_Closure; the field name looks like a typo for FC_NFKC_Closure_Detail.
+    // Renaming would change the public name, so check callers first.
+    public static UCDPropertyDetail FC_NFC_Closure_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.FC_NFKC_Closure,
+                    VersionInfo.getInstance(3, 1, 0),
+                    88,
+                    true,
+                    false,
+                    false,
+                    true);
+    // Casing-related properties, NFKC_Casefold and Indic_Syllabic_Category (integer arguments
+    // 89-98). All ten use the flags (true, false, false, true); all but the last pass 5.2.0.
+    public static UCDPropertyDetail Case_Ignorable_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Case_Ignorable,
+                    VersionInfo.getInstance(5, 2, 0),
+                    89,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Cased_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Cased,
+                    VersionInfo.getInstance(5, 2, 0),
+                    90,
+                    true,
+                    false,
+                    false,
+                    true);
+    // NOTE(review): this field and the next one spell "CaseFolded" / "CaseMapped" with an inner
+    // capital, unlike the UcdProperty constants they wrap (Changes_When_Casefolded,
+    // Changes_When_Casemapped) and unlike Changes_When_NFKC_Casefolded_Detail below.
+    public static UCDPropertyDetail Changes_When_CaseFolded_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Changes_When_Casefolded,
+                    VersionInfo.getInstance(5, 2, 0),
+                    91,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Changes_When_CaseMapped_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Changes_When_Casemapped,
+                    VersionInfo.getInstance(5, 2, 0),
+                    92,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Changes_When_NFKC_Casefolded_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Changes_When_NFKC_Casefolded,
+                    VersionInfo.getInstance(5, 2, 0),
+                    93,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Changes_When_Lowercased_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Changes_When_Lowercased,
+                    VersionInfo.getInstance(5, 2, 0),
+                    94,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Changes_When_Titlecased_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Changes_When_Titlecased,
+                    VersionInfo.getInstance(5, 2, 0),
+                    95,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Changes_When_Uppercased_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Changes_When_Uppercased,
+                    VersionInfo.getInstance(5, 2, 0),
+                    96,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail NFKC_Casefold_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.NFKC_Casefold,
+                    VersionInfo.getInstance(5, 2, 0),
+                    97,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Indic_Syllabic_Category_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Indic_Syllabic_Category,
+                    VersionInfo.getInstance(6, 1, 0),
+                    98,
+                    true,
+                    false,
+                    false,
+                    true);
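+    // Disabled (commented-out) entry; the declarations on either side skip integer 99.
+    // Unlike the active entries, it passes two VersionInfo arguments.
+    //     public static UCDPropertyDetail Indic_Matra_Category_Detail =
+    //             new UCDPropertyDetail(
+    //                     UcdProperty.Indic_Matra_Category,
+    //                     VersionInfo.getInstance(6, 1, 0),
+    //                     VersionInfo.getInstance(7, 0, 0),
+    //                     99, true, false, false, true);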
+    // Integer arguments 100-108. Three flag patterns appear in this run:
+    //   (true, false, false, true)  - Indic_Positional_Category, Prepended_Concatenation_Mark,
+    //                                 Vertical_Orientation, Regional_Indicator, Block
+    //   (false, true, false, true)  - kJa, Equivalent_Unified_Ideograph, kRSUnicode
+    //   (false, true, true, true)   - kCompatibilityVariant
+    // The flags' meaning is defined by the UCDPropertyDetail constructor (not shown here).
+    public static UCDPropertyDetail Indic_Positional_Category_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Indic_Positional_Category,
+                    VersionInfo.getInstance(8, 0, 0),
+                    100,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail kJa_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kJa,
+                    VersionInfo.getInstance(8, 0, 0),
+                    101,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail Prepended_Concatenation_Mark_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Prepended_Concatenation_Mark,
+                    VersionInfo.getInstance(9, 0, 0),
+                    102,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Vertical_Orientation_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Vertical_Orientation,
+                    VersionInfo.getInstance(10, 0, 0),
+                    103,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Regional_Indicator_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Regional_Indicator,
+                    VersionInfo.getInstance(10, 0, 0),
+                    104,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Block_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Block,
+                    VersionInfo.getInstance(2, 0, 0),
+                    105,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Equivalent_Unified_Ideograph_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Equivalent_Unified_Ideograph,
+                    VersionInfo.getInstance(11, 0, 0),
+                    106,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kCompatibilityVariant_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kCompatibilityVariant,
+                    VersionInfo.getInstance(3, 2, 0),
+                    107,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kRSUnicode_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kRSUnicode,
+                    VersionInfo.getInstance(2, 0, 0),
+                    108,
+                    false,
+                    true,
+                    false,
+                    true);
+    // Disabled (commented-out) entry; the declarations on either side skip integer 109.
+    //     public static UCDPropertyDetail kIRG_RSIndex_Detail =
+    //             new UCDPropertyDetail(
+    //                     UcdProperty.kIRG_RSIndex,
+    //                     VersionInfo.getInstance(11, 0, 0),
+    //                     109, false, true, false, true);
+    // kIRG_*Source properties (integer arguments 110-117). Every entry in this run passes the
+    // flags (false, true, true, true); only the version argument varies.
+    public static UCDPropertyDetail kIRG_GSource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_GSource,
+                    VersionInfo.getInstance(3, 0, 0),
+                    110,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIRG_TSource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_TSource,
+                    VersionInfo.getInstance(3, 0, 0),
+                    111,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIRG_JSource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_JSource,
+                    VersionInfo.getInstance(3, 0, 0),
+                    112,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIRG_KSource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_KSource,
+                    VersionInfo.getInstance(3, 0, 0),
+                    113,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIRG_KPSource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_KPSource,
+                    VersionInfo.getInstance(3, 1, 1),
+                    114,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIRG_VSource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_VSource,
+                    VersionInfo.getInstance(3, 0, 0),
+                    115,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIRG_HSource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_HSource,
+                    VersionInfo.getInstance(3, 1, 0),
+                    116,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIRG_USource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_USource,
+                    VersionInfo.getInstance(4, 0, 1),
+                    117,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIRG_MSource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_MSource,
+                    VersionInfo.getInstance(5, 2, 0),
+                    118,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIRG_UKSource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_UKSource,
+                    VersionInfo.getInstance(13, 0, 0),
+                    119,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIRG_SSource_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRG_SSource,
+                    VersionInfo.getInstance(13, 0, 0),
+                    120,
+                    false,
+                    true,
+                    true,
+                    true);
+    public static UCDPropertyDetail kIICore_Detail =
+            new UCDPropertyDetail( // args: property, version, integer, four boolean flags
+                    UcdProperty.kIICore,
+                    VersionInfo.getInstance(4, 1, 0),
+                    121,
+                    false,
+                    true,
+                    false, // third flag is false again from this entry on
+                    true);
+    public static UCDPropertyDetail kUnihanCore2020_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kUnihanCore2020,
+                    VersionInfo.getInstance(13, 0, 0),
+                    122,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kGB0_Detail =
+            new UCDPropertyDetail( // args: property, version, integer, four boolean flags
+                    UcdProperty.kGB0,
+                    VersionInfo.getInstance(2, 0, 0),
+                    123,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kGB1_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kGB1,
+                    VersionInfo.getInstance(2, 0, 0),
+                    124,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kGB3_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kGB3,
+                    VersionInfo.getInstance(2, 0, 0),
+                    125,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kGB5_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kGB5,
+                    VersionInfo.getInstance(2, 0, 0),
+                    126,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kGB7_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kGB7,
+                    VersionInfo.getInstance(2, 0, 0),
+                    127,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kGB8_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kGB8,
+                    VersionInfo.getInstance(2, 0, 0),
+                    128,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kCNS1986_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kCNS1986,
+                    VersionInfo.getInstance(2, 0, 0),
+                    129,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kCNS1992_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kCNS1992,
+                    VersionInfo.getInstance(2, 0, 0),
+                    130,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kJis0_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kJis0,
+                    VersionInfo.getInstance(2, 0, 0),
+                    131,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kJis1_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kJis1,
+                    VersionInfo.getInstance(2, 0, 0),
+                    132,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kJIS0213_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kJIS0213,
+                    VersionInfo.getInstance(3, 1, 1),
+                    133,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kKSC0_Detail =
+            new UCDPropertyDetail( // overload with two versions; also used by the next four entries
+                    UcdProperty.kKSC0,
+                    VersionInfo.getInstance(2, 0, 0),
+                    VersionInfo.getInstance(15, 1, 0), // NOTE(review): presumably removal version; confirm
+                    134,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kKSC1_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kKSC1,
+                    VersionInfo.getInstance(2, 0, 0),
+                    VersionInfo.getInstance(15, 1, 0),
+                    135,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kKPS0_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kKPS0,
+                    VersionInfo.getInstance(3, 1, 1),
+                    VersionInfo.getInstance(15, 1, 0),
+                    136,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kKPS1_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kKPS1,
+                    VersionInfo.getInstance(3, 1, 1),
+                    VersionInfo.getInstance(15, 1, 0),
+                    137,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kHKSCS_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kHKSCS,
+                    VersionInfo.getInstance(3, 1, 1),
+                    VersionInfo.getInstance(15, 1, 0),
+                    138,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kCantonese_Detail =
+            new UCDPropertyDetail( // args: property, version, integer, four boolean flags
+                    UcdProperty.kCantonese,
+                    VersionInfo.getInstance(2, 0, 0),
+                    139,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kHangul_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kHangul,
+                    VersionInfo.getInstance(5, 0, 0),
+                    140,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kDefinition_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kDefinition,
+                    VersionInfo.getInstance(2, 0, 0),
+                    141,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kHanYu_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kHanYu,
+                    VersionInfo.getInstance(2, 0, 0),
+                    142, // 143 appears only in the commented-out kAlternateHanYu entry below
+                    false,
+                    true,
+                    false,
+                    true);
+    //        public static UCDPropertyDetail kAlternateHanYu_Detail = new UCDPropertyDetail (
+    //            UcdProperty.kAlternateHanYu, VersionInfo.getInstance(2,0,0),
+    //            VersionInfo.getInstance(3,1,1), 143,
+    //            false, true, false, true);
+    public static UCDPropertyDetail kMandarin_Detail =
+            new UCDPropertyDetail( // args: property, version, integer, four boolean flags
+                    UcdProperty.kMandarin,
+                    VersionInfo.getInstance(2, 0, 0),
+                    144, // 143 appears only in the commented-out kAlternateHanYu entry above
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kCihaiT_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kCihaiT,
+                    VersionInfo.getInstance(3, 2, 0),
+                    145,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kSBGY_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kSBGY,
+                    VersionInfo.getInstance(3, 2, 0),
+                    146,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kNelson_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kNelson,
+                    VersionInfo.getInstance(2, 0, 0),
+                    147,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kCowles_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kCowles,
+                    VersionInfo.getInstance(3, 1, 1),
+                    148,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kMatthews_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kMatthews,
+                    VersionInfo.getInstance(2, 0, 0),
+                    149,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kOtherNumeric_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kOtherNumeric,
+                    VersionInfo.getInstance(3, 2, 0),
+                    150,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kPhonetic_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kPhonetic,
+                    VersionInfo.getInstance(3, 1, 0),
+                    151,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kGSR_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kGSR,
+                    VersionInfo.getInstance(4, 0, 1),
+                    152,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kFenn_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kFenn,
+                    VersionInfo.getInstance(3, 1, 1),
+                    153,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kFennIndex_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kFennIndex,
+                    VersionInfo.getInstance(4, 1, 0),
+                    154,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kKarlgren_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kKarlgren,
+                    VersionInfo.getInstance(3, 1, 1),
+                    155,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kCangjie_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kCangjie,
+                    VersionInfo.getInstance(3, 1, 1),
+                    156,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kMeyerWempe_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kMeyerWempe,
+                    VersionInfo.getInstance(3, 1, 0),
+                    157,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kSimplifiedVariant_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kSimplifiedVariant,
+                    VersionInfo.getInstance(2, 0, 0),
+                    158,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kTraditionalVariant_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kTraditionalVariant,
+                    VersionInfo.getInstance(2, 0, 0),
+                    159,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kSpecializedSemanticVariant_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kSpecializedSemanticVariant,
+                    VersionInfo.getInstance(2, 0, 0),
+                    160,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kSemanticVariant_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kSemanticVariant,
+                    VersionInfo.getInstance(2, 0, 0),
+                    161,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kVietnamese_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kVietnamese,
+                    VersionInfo.getInstance(3, 1, 1),
+                    162,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kLau_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kLau,
+                    VersionInfo.getInstance(3, 1, 1),
+                    163,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kTang_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kTang,
+                    VersionInfo.getInstance(2, 0, 0),
+                    164,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kZVariant_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kZVariant,
+                    VersionInfo.getInstance(2, 0, 0),
+                    165,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kJapaneseKun_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kJapaneseKun,
+                    VersionInfo.getInstance(2, 0, 0),
+                    166,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kJapaneseOn_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kJapaneseOn,
+                    VersionInfo.getInstance(2, 0, 0),
+                    167,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kKangXi_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kKangXi,
+                    VersionInfo.getInstance(2, 0, 0),
+                    168, // 169 appears only in the commented-out kAlternateKangXi entry below
+                    false,
+                    true,
+                    false,
+                    true);
+    //    public static UCDPropertyDetail kAlternateKangXi_Detail = new UCDPropertyDetail (
+    //            UcdProperty.kAlternateKangXi, VersionInfo.getInstance(2,0,0),
+    //            VersionInfo.getInstance(4,0,1), 169,
+    //            false, true, false, true);
+    public static UCDPropertyDetail kBigFive_Detail =
+            new UCDPropertyDetail( // args: property, version, integer, four boolean flags
+                    UcdProperty.kBigFive,
+                    VersionInfo.getInstance(2, 0, 0),
+                    170, // 169 appears only in the commented-out kAlternateKangXi entry above
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kCCCII_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kCCCII,
+                    VersionInfo.getInstance(2, 0, 0),
+                    171,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kDaeJaweon_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kDaeJaweon,
+                    VersionInfo.getInstance(2, 0, 0),
+                    172,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kEACC_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kEACC,
+                    VersionInfo.getInstance(2, 0, 0),
+                    173,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kFrequency_Detail =
+            new UCDPropertyDetail( // overload with two versions
+                    UcdProperty.kFrequency,
+                    VersionInfo.getInstance(3, 2, 0),
+                    VersionInfo.getInstance(16, 0, 0), // NOTE(review): presumably removal version; confirm
+                    174,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kGradeLevel_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kGradeLevel,
+                    VersionInfo.getInstance(3, 2, 0),
+                    175,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kHDZRadBreak_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kHDZRadBreak,
+                    VersionInfo.getInstance(4, 1, 0),
+                    176,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kHKGlyph_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kHKGlyph,
+                    VersionInfo.getInstance(3, 1, 1),
+                    177,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kHanyuPinlu_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kHanyuPinlu,
+                    VersionInfo.getInstance(4, 0, 1),
+                    178,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kHanyuPinyin_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kHanyuPinyin,
+                    VersionInfo.getInstance(5, 2, 0),
+                    179,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kIRGHanyuDaZidian_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRGHanyuDaZidian,
+                    VersionInfo.getInstance(3, 0, 0),
+                    180,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kIRGKangXi_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRGKangXi,
+                    VersionInfo.getInstance(3, 0, 0),
+                    181,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kIRGDaeJaweon_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIRGDaeJaweon,
+                    VersionInfo.getInstance(3, 0, 0),
+                    182,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kIRGDaiKanwaZiten_Detail =
+            new UCDPropertyDetail( // overload with two versions
+                    UcdProperty.kIRGDaiKanwaZiten,
+                    VersionInfo.getInstance(3, 0, 0),
+                    VersionInfo.getInstance(15, 1, 0), // NOTE(review): presumably removal version; confirm
+                    183,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kKorean_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kKorean,
+                    VersionInfo.getInstance(2, 0, 0),
+                    184,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kMainlandTelegraph_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kMainlandTelegraph,
+                    VersionInfo.getInstance(2, 0, 0),
+                    185,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kMorohashi_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kMorohashi,
+                    VersionInfo.getInstance(2, 0, 0),
+                    186, // 187 appears only in the commented-out kAlternateMorohashi entry below
+                    false,
+                    true,
+                    false,
+                    true);
+    //    public static UCDPropertyDetail kAlternateMorohashi_Detail = new UCDPropertyDetail (
+    //            UcdProperty.kAlternateMorohashi, VersionInfo.getInstance(2,0,0),
+    //            VersionInfo.getInstance(4,0,1), 187,
+    //            false, true, false, true);
+    public static UCDPropertyDetail kPrimaryNumeric_Detail =
+            new UCDPropertyDetail( // args: property, version, integer, four boolean flags
+                    UcdProperty.kPrimaryNumeric,
+                    VersionInfo.getInstance(3, 2, 0),
+                    188, // 187 appears only in the commented-out kAlternateMorohashi entry above
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kTaiwanTelegraph_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kTaiwanTelegraph,
+                    VersionInfo.getInstance(2, 0, 0),
+                    189,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kXerox_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kXerox,
+                    VersionInfo.getInstance(2, 0, 0),
+                    190,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kPseudoGB1_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kPseudoGB1,
+                    VersionInfo.getInstance(2, 0, 0),
+                    191,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kIBMJapan_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kIBMJapan,
+                    VersionInfo.getInstance(2, 0, 0),
+                    192,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kAccountingNumeric_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kAccountingNumeric,
+                    VersionInfo.getInstance(3, 2, 0),
+                    193,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kCheungBauer_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kCheungBauer,
+                    VersionInfo.getInstance(5, 0, 0),
+                    194,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kCheungBauerIndex_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kCheungBauerIndex,
+                    VersionInfo.getInstance(5, 0, 0),
+                    195,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kFourCornerCode_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kFourCornerCode,
+                    VersionInfo.getInstance(5, 0, 0),
+                    196, // 197 appears only in the commented-out kWubi entry below
+                    false,
+                    true,
+                    false,
+                    true);
+    //    public static UCDPropertyDetail kWubi_Detail = new UCDPropertyDetail (
+    //            UcdProperty.kWubi, VersionInfo.getInstance(11,0,0), 197,
+    //            false, true, false, true);
+    public static UCDPropertyDetail kXHC1983_Detail =
+            new UCDPropertyDetail( // args: property, version, integer, four boolean flags
+                    UcdProperty.kXHC1983,
+                    VersionInfo.getInstance(5, 1, 0),
+                    198, // 197 appears only in the commented-out kWubi entry above
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kJinmeiyoKanji_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kJinmeiyoKanji,
+                    VersionInfo.getInstance(11, 0, 0),
+                    199,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kJoyoKanji_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kJoyoKanji,
+                    VersionInfo.getInstance(11, 0, 0),
+                    200,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kKoreanEducationHanja_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kKoreanEducationHanja,
+                    VersionInfo.getInstance(11, 0, 0),
+                    201,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kKoreanName_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kKoreanName,
+                    VersionInfo.getInstance(11, 0, 0),
+                    202,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kTGH_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kTGH,
+                    VersionInfo.getInstance(11, 0, 0),
+                    203,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kTGHZ2013_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kTGHZ2013,
+                    VersionInfo.getInstance(13, 0, 0),
+                    204,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kSpoofingVariant_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kSpoofingVariant,
+                    VersionInfo.getInstance(13, 0, 0),
+                    205,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kRSKanWa_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kRSKanWa,
+                    VersionInfo.getInstance(2, 0, 0),
+                    206,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kRSJapanese_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kRSJapanese,
+                    VersionInfo.getInstance(2, 0, 0),
+                    207,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kRSKorean_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kRSKorean,
+                    VersionInfo.getInstance(2, 0, 0),
+                    208,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kRSKangXi_Detail =
+            new UCDPropertyDetail( // overload with two versions
+                    UcdProperty.kRSKangXi,
+                    VersionInfo.getInstance(2, 0, 0),
+                    VersionInfo.getInstance(15, 1, 0), // NOTE(review): presumably removal version; confirm
+                    209,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kRSAdobe_Japan1_6_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kRSAdobe_Japan1_6,
+                    VersionInfo.getInstance(4, 1, 0),
+                    210,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kTotalStrokes_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kTotalStrokes,
+                    VersionInfo.getInstance(3, 1, 0),
+                    211,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kRSTUnicode_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kRSTUnicode,
+                    VersionInfo.getInstance(9, 0, 0),
+                    212,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kTGT_MergedSrc_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kTGT_MergedSrc,
+                    VersionInfo.getInstance(9, 0, 0),
+                    213,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kSrc_NushuDuben_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kSrc_NushuDuben,
+                    VersionInfo.getInstance(10, 0, 0),
+                    214,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kReading_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kReading,
+                    VersionInfo.getInstance(10, 0, 0),
+                    215,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail ISO_Comment_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.ISO_Comment,
+                    VersionInfo.getInstance(11, 0, 0), // minVersion
+                    216, // sortOrder
+                    true, // isBaseAttribute
+                    false, // isCJKAttribute
+                    false, // isCJKShowIfEmpty
+                    true); // isOrgUCDXMLAttribute
+    public static UCDPropertyDetail Unicode_1_Name_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Unicode_1_Name,
+                    VersionInfo.getInstance(2, 0, 0),
+                    217,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Name_Alias_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Name_Alias,
+                    VersionInfo.getInstance(5, 0, 0),
+                    218,
+                    false, // isBaseAttribute
+                    false, // isCJKAttribute (neither flag set: registered in values() only)
+                    false,
+                    true);
+    public static UCDPropertyDetail Emoji_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Emoji,
+                    VersionInfo.getInstance(13, 0, 0),
+                    219,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Emoji_Presentation_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Emoji_Presentation,
+                    VersionInfo.getInstance(13, 0, 0),
+                    220,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Emoji_Modifier_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Emoji_Modifier,
+                    VersionInfo.getInstance(13, 0, 0),
+                    221,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Emoji_Modifier_Base_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Emoji_Modifier_Base,
+                    VersionInfo.getInstance(13, 0, 0),
+                    222,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Emoji_Component_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Emoji_Component,
+                    VersionInfo.getInstance(13, 0, 0),
+                    223,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail Extended_Pictographic_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Extended_Pictographic,
+                    VersionInfo.getInstance(13, 0, 0),
+                    224,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail kStrange_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kStrange,
+                    VersionInfo.getInstance(14, 0, 0),
+                    225,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kAlternateTotalStrokes_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kAlternateTotalStrokes,
+                    VersionInfo.getInstance(15, 0, 0),
+                    226,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail NFKC_Simple_Casefold_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.NFKC_Simple_Casefold,
+                    VersionInfo.getInstance(15, 1, 0),
+                    227,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail ID_Compat_Math_Start_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.ID_Compat_Math_Start,
+                    VersionInfo.getInstance(15, 1, 0),
+                    228,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail ID_Compat_Math_Continue_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.ID_Compat_Math_Continue,
+                    VersionInfo.getInstance(15, 1, 0),
+                    229,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail IDS_Unary_Operator_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.IDS_Unary_Operator,
+                    VersionInfo.getInstance(15, 1, 0),
+                    230,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail kJapanese_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kJapanese,
+                    VersionInfo.getInstance(15, 1, 0), // minVersion
+                    231, // sortOrder
+                    false, // isBaseAttribute
+                    true, // isCJKAttribute
+                    false, // isCJKShowIfEmpty
+                    true); // isOrgUCDXMLAttribute
+    public static UCDPropertyDetail kMojiJoho_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kMojiJoho,
+                    VersionInfo.getInstance(15, 1, 0),
+                    232,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kSMSZD2003Index_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kSMSZD2003Index,
+                    VersionInfo.getInstance(15, 1, 0),
+                    233,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kSMSZD2003Readings_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kSMSZD2003Readings,
+                    VersionInfo.getInstance(15, 1, 0),
+                    234,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kVietnameseNumeric_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kVietnameseNumeric,
+                    VersionInfo.getInstance(15, 1, 0),
+                    235,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kZhuang_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kZhuang,
+                    VersionInfo.getInstance(16, 0, 0),
+                    236,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail kZhuangNumeric_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kZhuangNumeric,
+                    VersionInfo.getInstance(15, 1, 0),
+                    237,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail Indic_Conjunct_Break_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Indic_Conjunct_Break,
+                    VersionInfo.getInstance(15, 1, 0),
+                    238,
+                    true, // isBaseAttribute
+                    false, // isCJKAttribute
+                    false,
+                    true);
+    public static UCDPropertyDetail Modifier_Combining_Mark_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Modifier_Combining_Mark,
+                    VersionInfo.getInstance(16, 0, 0),
+                    239,
+                    true,
+                    false,
+                    false,
+                    true);
+    public static UCDPropertyDetail kFanqie_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.kFanqie,
+                    VersionInfo.getInstance(16, 0, 0),
+                    240,
+                    false,
+                    true,
+                    false,
+                    true);
+    public static UCDPropertyDetail Basic_Emoji_Detail = // 6-argument form: no version bounds
+            new UCDPropertyDetail(UcdProperty.Basic_Emoji, -1, false, false, false, false);
+    public static UCDPropertyDetail CJK_Radical_Detail =
+            new UCDPropertyDetail(UcdProperty.CJK_Radical, -2, false, false, false, false);
+    public static UCDPropertyDetail Confusable_MA_Detail =
+            new UCDPropertyDetail(UcdProperty.Confusable_MA, -3, false, false, false, false);
+    public static UCDPropertyDetail Confusable_ML_Detail =
+            new UCDPropertyDetail(UcdProperty.Confusable_ML, -4, false, false, false, false);
+    public static UCDPropertyDetail Confusable_SA_Detail =
+            new UCDPropertyDetail(UcdProperty.Confusable_SA, -5, false, false, false, false);
+    public static UCDPropertyDetail Confusable_SL_Detail =
+            new UCDPropertyDetail(UcdProperty.Confusable_SL, -6, false, false, false, false);
+    public static UCDPropertyDetail Do_Not_Emit_Preferred_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Do_Not_Emit_Preferred, -7, false, false, false, false);
+    public static UCDPropertyDetail Do_Not_Emit_Type_Detail =
+            new UCDPropertyDetail(UcdProperty.Do_Not_Emit_Type, -8, false, false, false, false);
+    public static UCDPropertyDetail Emoji_DCM_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Emoji_DCM,
+                    VersionInfo.getInstance(6, 0, 0), // minVersion
+                    -9, // sortOrder
+                    false, // isBaseAttribute
+                    false, // isCJKAttribute (neither flag set: registered in values() only)
+                    false, // isCJKShowIfEmpty
+                    false); // isOrgUCDXMLAttribute
+    public static UCDPropertyDetail Emoji_KDDI_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Emoji_KDDI,
+                    VersionInfo.getInstance(6, 0, 0),
+                    -10,
+                    false,
+                    false,
+                    false,
+                    false);
+    public static UCDPropertyDetail Emoji_SB_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Emoji_SB,
+                    VersionInfo.getInstance(6, 0, 0),
+                    -11,
+                    false,
+                    false,
+                    false,
+                    false);
+    public static UCDPropertyDetail Identifier_Status_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Identifier_Status,
+                    VersionInfo.getInstance(9, 0, 0),
+                    -12,
+                    false,
+                    false,
+                    false,
+                    false);
+    public static UCDPropertyDetail Identifier_Type_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Identifier_Type,
+                    VersionInfo.getInstance(9, 0, 0),
+                    -13,
+                    false,
+                    false,
+                    false,
+                    false);
+    public static UCDPropertyDetail Idn_2008_Detail =
+            new UCDPropertyDetail(UcdProperty.Idn_2008, -14, false, false, false, false);
+    public static UCDPropertyDetail Idn_Mapping_Detail =
+            new UCDPropertyDetail(UcdProperty.Idn_Mapping, -15, false, false, false, false);
+    public static UCDPropertyDetail Idn_Status_Detail =
+            new UCDPropertyDetail(UcdProperty.Idn_Status, -16, false, false, false, false);
+    public static UCDPropertyDetail Named_Sequences_Detail =
+            new UCDPropertyDetail(UcdProperty.Named_Sequences, -17, false, false, false, false);
+    public static UCDPropertyDetail Named_Sequences_Prov_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Named_Sequences_Prov, -18, false, false, false, false);
+    public static UCDPropertyDetail Other_Joining_Type_Detail =
+            new UCDPropertyDetail(UcdProperty.Other_Joining_Type, -19, false, false, false, false);
+    public static UCDPropertyDetail RGI_Emoji_Flag_Sequence_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.RGI_Emoji_Flag_Sequence, -20, false, false, false, false);
+    public static UCDPropertyDetail RGI_Emoji_Keycap_Sequence_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.RGI_Emoji_Keycap_Sequence, -21, false, false, false, false);
+    public static UCDPropertyDetail RGI_Emoji_Modifier_Sequence_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.RGI_Emoji_Modifier_Sequence, -22, false, false, false, false);
+    public static UCDPropertyDetail RGI_Emoji_Tag_Sequence_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.RGI_Emoji_Tag_Sequence, -23, false, false, false, false);
+    public static UCDPropertyDetail RGI_Emoji_Zwj_Sequence_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.RGI_Emoji_Zwj_Sequence, -24, false, false, false, false);
+    public static UCDPropertyDetail Standardized_Variant_Detail =
+            new UCDPropertyDetail(
+                    UcdProperty.Standardized_Variant, -25, false, false, false, false);
+
+    private final UcdProperty ucdProperty; // property this detail describes
+    private final VersionInfo minVersion; // null when built without version bounds
+    private final VersionInfo maxVersion; // null unless a maximum was supplied
+    private final int sortOrder;
+    private final boolean isBaseAttribute; // true: also registered in basePropertyDetails
+    private final boolean isCJKAttribute; // true: also registered in cjkPropertyDetails
+    private final boolean isCJKShowIfEmpty;
+    private final boolean isOrgUCDXMLAttribute;
+
+    private UCDPropertyDetail(
+            UcdProperty ucdProperty,
+            VersionInfo minVersion,
+            int sortOrder,
+            boolean isBaseAttribute,
+            boolean isCJKAttribute,
+            boolean isCJKShowIfEmpty,
+            boolean isOrgUCDXMLAttribute) {
+        this( // delegates to the 8-argument constructor
+                ucdProperty,
+                minVersion,
+                null, // maxVersion: none given
+                sortOrder,
+                isBaseAttribute,
+                isCJKAttribute,
+                isCJKShowIfEmpty,
+                isOrgUCDXMLAttribute);
+    }
+
+    private UCDPropertyDetail(
+            UcdProperty ucdProperty,
+            int sortOrder,
+            boolean isBaseAttribute,
+            boolean isCJKAttribute,
+            boolean isCJKShowIfEmpty,
+            boolean isOrgUCDXMLAttribute) {
+        this( // delegates to the 8-argument constructor
+                ucdProperty,
+                null, // minVersion: none given
+                null, // maxVersion: none given
+                sortOrder,
+                isBaseAttribute,
+                isCJKAttribute,
+                isCJKShowIfEmpty,
+                isOrgUCDXMLAttribute);
+    }
+
+    private UCDPropertyDetail(
+            UcdProperty ucdProperty,
+            VersionInfo minVersion,
+            VersionInfo maxVersion,
+            int sortOrder,
+            boolean isBaseAttribute,
+            boolean isCJKAttribute,
+            boolean isCJKShowIfEmpty,
+            boolean isOrgUCDXMLAttribute) {
+        this.ucdProperty = ucdProperty;
+        this.minVersion = minVersion; // may be null
+        this.maxVersion = maxVersion; // may be null
+        this.sortOrder = sortOrder;
+        this.isBaseAttribute = isBaseAttribute;
+        this.isCJKAttribute = isCJKAttribute;
+        this.isCJKShowIfEmpty = isCJKShowIfEmpty;
+        this.isOrgUCDXMLAttribute = isOrgUCDXMLAttribute;
+        // Self-register: always in the "all" set; the base/CJK flags add the matching sets.
+        allPropertyDetails.add(this);
+        if (isBaseAttribute) {
+            basePropertyDetails.add(this);
+            ucdxmlPropertyDetails.add(this);
+        }
+        if (isCJKAttribute) {
+            cjkPropertyDetails.add(this);
+            ucdxmlPropertyDetails.add(this);
+        }
+    }
+
+    public static Set<UCDPropertyDetail> values() {
+        return java.util.Collections.unmodifiableSet(allPropertyDetails); // read-only view
+    }
+
+    public static Set<UCDPropertyDetail> baseValues() {
+        return java.util.Collections.unmodifiableSet(basePropertyDetails); // read-only view
+    }
+
+    public static Set<UCDPropertyDetail> cjkValues() {
+        return java.util.Collections.unmodifiableSet(cjkPropertyDetails); // read-only view
+    }
+
+    public static Set<UCDPropertyDetail> ucdxmlValues() {
+        return java.util.Collections.unmodifiableSet(ucdxmlPropertyDetails); // read-only view
+    }
+
+    public UcdProperty getUcdProperty() {
+        return ucdProperty; // as passed to the constructor
+    }
+
+    public VersionInfo getMinVersion() {
+        return minVersion; // null when the detail was built without a minimum version
+    }
+
+    public VersionInfo getMaxVersion() {
+        return maxVersion; // null when the detail was built without a maximum version
+    }
+
+    public boolean isBaseAttribute() {
+        return isBaseAttribute; // flag given at construction
+    }
+
+    public boolean isCJKAttribute() {
+        return isCJKAttribute; // flag given at construction
+    }
+
+    public boolean isCJKShowIfEmpty() {
+        return isCJKShowIfEmpty; // flag given at construction
+    }
+
+    public boolean isOrgUCDXMLAttribute() {
+        return isOrgUCDXMLAttribute; // flag given at construction
+    }
+}
diff --git a/unicodetools/src/main/java/org/unicode/xml/UCDSectionComponent.java b/unicodetools/src/main/java/org/unicode/xml/UCDSectionComponent.java
new file mode 100644
index 000000000..0cef1e345
--- /dev/null
+++ b/unicodetools/src/main/java/org/unicode/xml/UCDSectionComponent.java
@@ -0,0 +1,36 @@
+package org.unicode.xml;
+
+import com.ibm.icu.util.VersionInfo;
+import org.unicode.props.UcdProperty;
+
+/**
+ * Value holder that ties a {@link UcdProperty} to two {@link VersionInfo} bounds, a minimum and a
+ * maximum version. All three values are fixed at construction.
+ */
+public class UCDSectionComponent {
+    private final UcdProperty ucdProperty;
+    private final VersionInfo minVersion;
+    private final VersionInfo maxVersion;
+
+    /** Stores the arguments as given; nothing is validated or copied. */
+    UCDSectionComponent(VersionInfo minVersion, VersionInfo maxVersion, UcdProperty ucdProperty) {
+        this.ucdProperty = ucdProperty;
+        this.minVersion = minVersion;
+        this.maxVersion = maxVersion;
+    }
+
+    /** Returns the minimum version passed to the constructor. */
+    public VersionInfo getMinVersion() {
+        return minVersion;
+    }
+
+    /** Returns the maximum version passed to the constructor. */
+    public VersionInfo getMaxVersion() {
+        return maxVersion;
+    }
+
+    /** Returns the property passed to the constructor. */
+    public UcdProperty getUcdProperty() {
+        return ucdProperty;
+    }
+}
diff --git a/unicodetools/src/main/java/org/unicode/xml/UCDSectionDetail.java b/unicodetools/src/main/java/org/unicode/xml/UCDSectionDetail.java
new file mode 100644
index 000000000..6db3cf82b
--- /dev/null
+++ b/unicodetools/src/main/java/org/unicode/xml/UCDSectionDetail.java
@@ -0,0 +1,265 @@
+package org.unicode.xml;
+
+import com.ibm.icu.util.VersionInfo;
+import java.util.function.Supplier;
+import org.unicode.props.UcdProperty;
+
+/**
+ * Helper class that defines an object that stores information about a section of the UCDXML file.
+ * Information includes the section name, the type of elements that the section contains, and the
+ * version range of the section.
+ *
+ * <p>Every {@link UcdSection} constant is paired with one of the static {@code *_Detail}
+ * instances declared in this class, and each instance refers back to its constant. The enum
+ * therefore holds a {@link Supplier} and reads the static field only when {@link
+ * UcdSection#getUcdSectionDetail()} is called, so that neither side captures a reference to the
+ * other while it is still being initialized.
+ */
+public class UCDSectionDetail {
+
+    /** Sections of a UCDXML file, with their XML tags, version range and parser flags. */
+    public enum UcdSection {
+        BLOCKS(
+                "blocks",
+                "block",
+                VersionInfo.getInstance(1, 1, 0),
+                null,
+                () -> Blocks_Detail,
+                true,
+                true),
+        CJKRADICALS(
+                "cjk-radicals",
+                "cjk-radical",
+                VersionInfo.getInstance(1, 1, 0),
+                null,
+                () -> CJKRadicals_Detail,
+                false,
+                false),
+        DONOTEMIT(
+                "do-not-emit",
+                "instead",
+                VersionInfo.getInstance(16, 0, 0),
+                null,
+                () -> DoNotEmit_Detail,
+                false,
+                false),
+        EMOJISOURCES(
+                "emoji-sources",
+                "emoji-source",
+                VersionInfo.getInstance(1, 1, 0),
+                null,
+                () -> EmojiSources_Detail,
+                true,
+                false),
+        NAMEDSEQUENCES(
+                "named-sequences",
+                "named-sequence",
+                VersionInfo.getInstance(1, 1, 0),
+                null,
+                () -> NamedSequences_Detail,
+                false,
+                false),
+        PROVISIONALNAMEDSEQUENCES(
+                "provisional-named-sequences",
+                "named-sequence",
+                VersionInfo.getInstance(5, 0, 0),
+                VersionInfo.getInstance(13, 0, 0),
+                () -> ProvisionalNamedSequences_Detail,
+                false,
+                false),
+        NORMALIZATIONCORRECTIONS(
+                "normalization-corrections",
+                "normalization-correction",
+                VersionInfo.getInstance(1, 1, 0),
+                null,
+                () -> NormalizationCorrections_Detail,
+                true,
+                false),
+        STANDARDIZEDVARIANTS(
+                "standardized-variants",
+                "standardized-variant",
+                VersionInfo.getInstance(1, 1, 0),
+                null,
+                () -> StandardizedVariants_Detail,
+                true,
+                false);
+        private final String tag;
+        private final String childTag;
+        private final VersionInfo minVersion;
+        private final VersionInfo maxVersion;
+        private final Supplier<UCDSectionDetail> ucdSectionDetail;
+        private final boolean parserWithRange;
+        private final boolean parserWithMissing;
+
+        /**
+         * @param tag name of the section element; also returned by {@link #toString()}
+         * @param childTag name of the elements contained in the section
+         * @param minVersion first version of the section's version range
+         * @param maxVersion last version of the section's version range, or {@code null}
+         * @param ucdSectionDetail deferred lookup of the paired {@code *_Detail} field
+         * @param parserWithRange value returned by {@link #getParserWithRange()}
+         * @param parserWithMissing value returned by {@link #getParserWithMissing()}
+         */
+        UcdSection(
+                String tag,
+                String childTag,
+                VersionInfo minVersion,
+                VersionInfo maxVersion,
+                Supplier<UCDSectionDetail> ucdSectionDetail,
+                boolean parserWithRange,
+                boolean parserWithMissing) {
+            this.tag = tag;
+            this.childTag = childTag;
+            this.minVersion = minVersion;
+            this.maxVersion = maxVersion;
+            this.ucdSectionDetail = ucdSectionDetail;
+            this.parserWithRange = parserWithRange;
+            this.parserWithMissing = parserWithMissing;
+        }
+
+        /** Returns the section's tag. */
+        @Override
+        public String toString() {
+            return tag;
+        }
+
+        /** Returns the tag of the section's child elements. */
+        public String getChildTag() {
+            return childTag;
+        }
+
+        /** Returns the first version of the section's version range. */
+        public VersionInfo getMinVersion() {
+            return minVersion;
+        }
+
+        /** Returns the last version of the section's version range; may be {@code null}. */
+        public VersionInfo getMaxVersion() {
+            return maxVersion;
+        }
+
+        /**
+         * Returns the {@link UCDSectionDetail} paired with this section. The static field is read
+         * on each call instead of being captured when the enum constant is constructed.
+         */
+        public UCDSectionDetail getUcdSectionDetail() {
+            return ucdSectionDetail.get();
+        }
+
+        /** Returns the {@code parserWithRange} flag given to the constructor. */
+        public boolean getParserWithRange() {
+            return parserWithRange;
+        }
+
+        /** Returns the {@code parserWithMissing} flag given to the constructor. */
+        public boolean getParserWithMissing() {
+            return parserWithMissing;
+        }
+    }
+
+    public static UCDSectionDetail Blocks_Detail =
+            new UCDSectionDetail(
+                    UcdSection.BLOCKS,
+                    new UCDSectionComponent[] {
+                        new UCDSectionComponent(
+                                VersionInfo.getInstance(1, 1, 0), null, UcdProperty.Block)
+                    },
+                    0);
+    public static UCDSectionDetail NamedSequences_Detail =
+            new UCDSectionDetail(
+                    UcdSection.NAMEDSEQUENCES,
+                    new UCDSectionComponent[] {
+                        new UCDSectionComponent(
+                                VersionInfo.getInstance(1, 1, 0), null, UcdProperty.Named_Sequences)
+                    },
+                    1);
+    // NOTE(review): sortOrder 1 is also used by NamedSequences_Detail; confirm that sharing the
+    // value is intended.
+    public static UCDSectionDetail ProvisionalNamedSequences_Detail =
+            new UCDSectionDetail(
+                    UcdSection.PROVISIONALNAMEDSEQUENCES,
+                    new UCDSectionComponent[] {
+                        new UCDSectionComponent(
+                                VersionInfo.getInstance(5, 0, 0),
+                                VersionInfo.getInstance(13, 0, 0),
+                                UcdProperty.Named_Sequences_Prov)
+                    },
+                    1);
+    public static UCDSectionDetail NormalizationCorrections_Detail =
+            new UCDSectionDetail(
+                    UcdSection.NORMALIZATIONCORRECTIONS,
+                    new UCDSectionComponent[] {
+                        new UCDSectionComponent(
+                                VersionInfo.getInstance(1, 1, 0), null, UcdProperty.NC_Original)
+                    },
+                    2);
+    public static UCDSectionDetail StandardizedVariants_Detail =
+            new UCDSectionDetail(
+                    UcdSection.STANDARDIZEDVARIANTS,
+                    new UCDSectionComponent[] {
+                        new UCDSectionComponent(
+                                VersionInfo.getInstance(1, 1, 0),
+                                null,
+                                UcdProperty.Standardized_Variant),
+                        new UCDSectionComponent(
+                                VersionInfo.getInstance(13, 0, 0),
+                                null,
+                                UcdProperty.emoji_variation_sequence)
+                    },
+                    3);
+    public static UCDSectionDetail CJKRadicals_Detail =
+            new UCDSectionDetail(
+                    UcdSection.CJKRADICALS,
+                    new UCDSectionComponent[] {
+                        new UCDSectionComponent(
+                                VersionInfo.getInstance(1, 1, 0), null, UcdProperty.CJK_Radical)
+                    },
+                    4);
+    public static UCDSectionDetail EmojiSources_Detail =
+            new UCDSectionDetail(
+                    UcdSection.EMOJISOURCES,
+                    new UCDSectionComponent[] {
+                        new UCDSectionComponent(
+                                VersionInfo.getInstance(1, 1, 0), null, UcdProperty.Emoji_DCM)
+                    },
+                    5);
+    // NOTE(review): this component starts at 1.1.0 although UcdSection.DONOTEMIT starts at
+    // 16.0.0; confirm which minimum version is intended.
+    public static UCDSectionDetail DoNotEmit_Detail =
+            new UCDSectionDetail(
+                    UcdSection.DONOTEMIT,
+                    new UCDSectionComponent[] {
+                        new UCDSectionComponent(
+                                VersionInfo.getInstance(1, 1, 0),
+                                null,
+                                UcdProperty.Do_Not_Emit_Type)
+                    },
+                    6);
+
+    private final UcdSection ucdSection;
+    private final UCDSectionComponent[] ucdSectionComponents;
+    private final int sortOrder;
+
+    /** Stores the section, its components and its sort order as given. */
+    private UCDSectionDetail(
+            UcdSection ucdSection, UCDSectionComponent[] ucdSectionComponents, int sortOrder) {
+        this.ucdSection = ucdSection;
+        this.ucdSectionComponents = ucdSectionComponents;
+        this.sortOrder = sortOrder;
+    }
+
+    /** Returns the section this detail was created for. */
+    public UcdSection getSection() {
+        return this.ucdSection;
+    }
+
+    /** Returns the component array given at construction (the array itself, not a copy). */
+    public UCDSectionComponent[] getUcdSectionComponents() {
+        return this.ucdSectionComponents;
+    }
+
+    /** Returns the sort order given at construction. */
+    public int getSortOrder() {
+        return this.sortOrder;
+    }
+}
diff --git a/unicodetools/src/main/java/org/unicode/xml/UCDXML.java b/unicodetools/src/main/java/org/unicode/xml/UCDXML.java
new file mode 100644
index 000000000..d4c302e1d
--- /dev/null
+++ b/unicodetools/src/main/java/org/unicode/xml/UCDXML.java
@@ -0,0 +1,838 @@
+package org.unicode.xml;
+
+import com.ibm.icu.dev.tool.UOption;
+import com.ibm.icu.util.VersionInfo;
+import java.io.BufferedReader;
+import java.io.BufferedWriter;
+import java.io.File;
+import java.io.FileInputStream;
+import java.io.FileOutputStream;
+import java.io.IOException;
+import java.io.InputStreamReader;
+import java.io.OutputStreamWriter;
+import java.nio.charset.StandardCharsets;
+import java.util.ArrayList;
+import java.util.HashMap;
+import java.util.LinkedHashMap;
+import java.util.Locale;
+import java.util.Map;
+import java.util.Objects;
+import java.util.regex.Matcher;
+import java.util.regex.Pattern;
+import javax.xml.transform.TransformerConfigurationException;
+import org.unicode.props.IndexUnicodeProperties;
+import org.unicode.props.UcdProperty;
+import org.unicode.props.UcdPropertyValues;
+import org.unicode.text.utility.Settings;
+import org.xml.sax.SAXException;
+import org.xml.sax.helpers.AttributesImpl;
+
+/**
+ * Utility for generating UCDXML files. The utility can build flat or grouped versions of UCDXML for
+ * non-Unihan code points, Unihan code points, or the complete range of code points.
+ */
+public class UCDXML {
+    /** Namespace URI given to every addAttribute call and to the UCDDataResolver. */
+    private static final String NAMESPACE = "http://www.unicode.org/ns/2003/ucd/1.0";
+
+    /** Code point selections accepted by the --range option. */
+    private enum UCDXMLOUTPUTRANGE {
+        // isWritableCodePoint defines which code points each value selects.
+        ALL, NOUNIHAN, UNIHAN
+    }
+
+    /** File layouts accepted by the --output option. */
+    private enum UCDXMLOUTPUTTYPE {
+        FLAT, GROUPED
+    }
+
+    /** Kinds of code point runs; tag is the XML element name used when a run is written. */
+    private enum Range {
+        // CHARACTER and CJKUNIFIEDIDEOGRAPH share the "char" element name.
+        RESERVED("reserved"), SURROGATE("surrogate"),
+        NONCHARACTER("noncharacter"), CHARACTER("char"),
+        CJKUNIFIEDIDEOGRAPH("char"), NONRANGE("nonrange");
+
+        private final String tag;
+
+        Range(String elementName) {
+            tag = elementName;
+        }
+
+        @Override
+        public String toString() {
+            return tag;
+        }
+    }
+
+    private static final UOption[] options = { // positions must match the index constants below
+        UOption.HELP_H(), // HELP
+        UOption.create("ucdversion", 'v', UOption.OPTIONAL_ARG), // UCDVERSION
+        UOption.create("range", 'r', UOption.REQUIRES_ARG), // RANGE
+        UOption.create("output", 'o', UOption.REQUIRES_ARG), // OUTPUT
+        UOption.create("outputfolder", 'f', UOption.OPTIONAL_ARG) // OUTPUTFOLDER
+    };
+    private static final int HELP = 0, UCDVERSION = 1, RANGE = 2, OUTPUT = 3, OUTPUTFOLDER = 4;
+
+    /**
+     * Command-line entry point: parses the options, resolves the UCD version and the destination
+     * folder, then builds one UCDXML file per requested range/output combination. When --range or
+     * --output is not given, every value of that option is built. The JVM is always terminated
+     * through System.exit: 0 after --help or a successful run, 1 when an option is invalid.
+     *
+     * @param args command-line arguments; see the --help text for the accepted options
+     * @throws Exception if building one of the files fails
+     */
+    public static void main(String[] args) throws Exception {
+        UOption.parseArgs(args, options);
+
+        if (options[HELP].doesOccur) {
+            System.out.println(
+                    "UCDXML [--ucdversion {version number}] [--outputfolder {destination}] "
+                            + "--range [ALL|NOUNIHAN|UNIHAN] --output [FLAT|GROUPED]");
+            System.exit(0);
+        }
+
+        VersionInfo ucdVersion = null;
+        // Defaults when --range / --output are absent: every range in every layout.
+        UCDXMLOUTPUTRANGE[] ucdxmloutputranges = UCDXMLOUTPUTRANGE.values();
+        UCDXMLOUTPUTTYPE[] ucdxmloutputtypes = UCDXMLOUTPUTTYPE.values();
+        File destinationFolder = null;
+
+        // Any invalid option is reported on stderr and ends the run with status 1.
+        try {
+            if (options[UCDVERSION].doesOccur) {
+                try {
+                    ucdVersion = VersionInfo.getInstance(options[UCDVERSION].value);
+                } catch (Exception e) {
+                    throw new IllegalArgumentException(
+                            "Could not convert "
+                                    + options[UCDVERSION].value
+                                    + " to a valid UCD version",
+                            e);
+                }
+            } else {
+                ucdVersion = VersionInfo.getInstance(Settings.latestVersion);
+            }
+            if (options[RANGE].doesOccur) {
+                try {
+                    ucdxmloutputranges =
+                            new UCDXMLOUTPUTRANGE[] {
+                                UCDXMLOUTPUTRANGE.valueOf(
+                                        options[RANGE].value.toUpperCase(Locale.ROOT))
+                            };
+                } catch (Exception e) {
+                    throw new IllegalArgumentException(
+                            "Could not convert "
+                                    + options[RANGE].value
+                                    + " to one of [ALL|NOUNIHAN|UNIHAN]",
+                            e);
+                }
+            }
+            if (options[OUTPUT].doesOccur) {
+                try {
+                    ucdxmloutputtypes =
+                            new UCDXMLOUTPUTTYPE[] {
+                                UCDXMLOUTPUTTYPE.valueOf(
+                                        options[OUTPUT].value.toUpperCase(Locale.ROOT))
+                            };
+                } catch (Exception e) {
+                    throw new IllegalArgumentException(
+                            "Could not convert "
+                                    + options[OUTPUT].value
+                                    + " to one of [FLAT|GROUPED]",
+                            e);
+                }
+            }
+
+            // Default location: the "ucdxml" folder below Settings.Output.GEN_DIR.
+            String baseFolder = Settings.Output.GEN_DIR + "ucdxml";
+            if (options[OUTPUTFOLDER].doesOccur) {
+                if (options[OUTPUTFOLDER].value == null) {
+                    throw new IllegalArgumentException("--outputfolder requires a destination");
+                }
+                baseFolder = options[OUTPUTFOLDER].value;
+            }
+            destinationFolder =
+                    prepareDestinationFolder(baseFolder, ucdVersion.getVersionString(3, 3));
+        } catch (Exception e) {
+            System.err.println(e.getMessage());
+            System.exit(1);
+        }
+
+        if (ucdVersion != null && destinationFolder != null && destinationFolder.exists()) {
+            for (UCDXMLOUTPUTRANGE ucdxmloutputrange : ucdxmloutputranges) {
+                for (UCDXMLOUTPUTTYPE ucdxmloutputtype : ucdxmloutputtypes) {
+                    System.out.println(
+                            "Building the "
+                                    + ucdxmloutputrange
+                                    + " "
+                                    + ucdxmloutputtype
+                                    + " UcdXML file for "
+                                    + ucdVersion);
+                    buildUcdXMLFile(
+                            ucdVersion, destinationFolder, ucdxmloutputrange, ucdxmloutputtype);
+                }
+            }
+            System.out.println("End");
+            System.exit(0);
+        } else {
+            System.err.println("Unexpected error when building UcdXML file.");
+            System.exit(1);
+        }
+    }
+
+    /**
+     * Returns the version-specific output folder below baseFolder, creating it when necessary.
+     * The path is composed with File(parent, child) so that the platform separator is used; a
+     * hard-coded "\\" is only a separator on Windows and elsewhere ends up inside a single,
+     * oddly named directory.
+     *
+     * @param baseFolder folder that holds one sub-folder per UCD version
+     * @param versionString name of the sub-folder
+     * @return the existing or newly created folder
+     * @throws IllegalArgumentException if the folder does not exist and cannot be created
+     */
+    private static File prepareDestinationFolder(String baseFolder, String versionString) {
+        File folder = new File(baseFolder, versionString);
+        if (!folder.isDirectory() && !folder.mkdirs()) {
+            throw new IllegalArgumentException("Could not find or create " + folder);
+        }
+        return folder;
+    }
+
+    /**
+     * Builds one UCDXML file. The XML is first written to temp.xml in destinationFolder, then
+     * copied to ucd.{range}.{type}.xml by cleanUcdXMLFile, after which temp.xml is deleted.
+     *
+     * @param ucdVersion UCD version whose properties are written
+     * @param destinationFolder folder that receives the file
+     * @param outputRange code points to include; only the repertoire is written for UNIHAN
+     * @param outputType flat or grouped repertoire
+     * @throws IOException if a file cannot be written or temp.xml cannot be deleted
+     */
+    private static void buildUcdXMLFile(
+            VersionInfo ucdVersion,
+            File destinationFolder,
+            UCDXMLOUTPUTRANGE outputRange,
+            UCDXMLOUTPUTTYPE outputType)
+            throws IOException, TransformerConfigurationException, SAXException {
+        // Narrow these bounds (e.g. 0x17000..0x1B2FB for Tangut) to debug a single range.
+        int lowCodePoint = 0x0;
+        int highCodePoint = 0x10FFFF;
+
+        File tempFile = new File(destinationFolder, "temp.xml");
+        String outputFilename =
+                "ucd."
+                        + outputRange.toString().toLowerCase(Locale.ROOT)
+                        + "."
+                        + outputType.toString().toLowerCase(Locale.ROOT)
+                        + ".xml";
+        File destinationFile = new File(destinationFolder, outputFilename);
+
+        // try-with-resources: the stream is closed even when writing fails part-way.
+        try (FileOutputStream fileOutputStream = new FileOutputStream(tempFile)) {
+            UCDXMLWriter writer = new UCDXMLWriter(fileOutputStream);
+            IndexUnicodeProperties iup = IndexUnicodeProperties.make(ucdVersion);
+            AttributeResolver attributeResolver = new AttributeResolver(iup);
+            UCDDataResolver ucdDataResolver = new UCDDataResolver(iup, NAMESPACE, writer);
+
+            writer.startFile();
+            writer.startElement("ucd");
+            writer.startElement("description");
+            writer.addContent("Unicode " + ucdVersion.getVersionString(3, 3));
+            writer.endElement("description");
+            buildRepertoire(
+                    writer, attributeResolver, ucdVersion, lowCodePoint, highCodePoint,
+                    outputRange, outputType);
+            if (outputRange != UCDXMLOUTPUTRANGE.UNIHAN) {
+                ucdDataResolver.buildSection(UCDSectionDetail.UcdSection.BLOCKS);
+                ucdDataResolver.buildSection(UCDSectionDetail.UcdSection.NAMEDSEQUENCES);
+                ucdDataResolver.buildSection(
+                        UCDSectionDetail.UcdSection.PROVISIONALNAMEDSEQUENCES);
+                ucdDataResolver.buildSection(
+                        UCDSectionDetail.UcdSection.NORMALIZATIONCORRECTIONS);
+                ucdDataResolver.buildSection(UCDSectionDetail.UcdSection.STANDARDIZEDVARIANTS);
+                if (ucdVersion.compareTo(VersionInfo.getInstance(5, 2, 0)) >= 0) {
+                    ucdDataResolver.buildSection(UCDSectionDetail.UcdSection.CJKRADICALS);
+                }
+                if (ucdVersion.compareTo(VersionInfo.getInstance(6, 0, 0)) >= 0) {
+                    ucdDataResolver.buildSection(UCDSectionDetail.UcdSection.EMOJISOURCES);
+                }
+                if (ucdVersion.compareTo(VersionInfo.getInstance(16, 0, 0)) >= 0) {
+                    ucdDataResolver.buildSection(UCDSectionDetail.UcdSection.DONOTEMIT);
+                }
+            }
+            writer.endElement("ucd");
+            writer.endFile();
+        }
+        cleanUcdXMLFile(tempFile, destinationFile);
+        if (!tempFile.delete()) {
+            throw new IOException("Could not delete temporary file " + tempFile);
+        }
+    }
+
+    /**
+     * Copies tempFile to destinationFile (both UTF-8), replacing every decimal character
+     * reference ({@code &#NNN;}) with the character it denotes. XALAN writes characters outside
+     * the BMP as such references, see https://issues.apache.org/jira/browse/XALANJ-2595
+     * Lines are re-terminated with the platform line separator.
+     *
+     * @throws IOException if reading or writing fails
+     */
+    private static void cleanUcdXMLFile(File tempFile, File destinationFile) throws IOException {
+        Pattern decimalReference = Pattern.compile("&#(\\d+);"); // compiled once, not per line
+        // try-with-resources closes (and flushes) both files even when an exception is thrown.
+        try (FileInputStream fileInputStream = new FileInputStream(tempFile);
+                FileOutputStream fileOutputStream = new FileOutputStream(destinationFile);
+                BufferedReader bufferedReader =
+                        new BufferedReader(
+                                new InputStreamReader(fileInputStream, StandardCharsets.UTF_8));
+                BufferedWriter bufferedWriter =
+                        new BufferedWriter(
+                                new OutputStreamWriter(fileOutputStream, StandardCharsets.UTF_8))) {
+            String line;
+            while ((line = bufferedReader.readLine()) != null) {
+                line = decimalReference.matcher(line).replaceAll(match -> {
+                    int codePoint = Integer.parseInt(match.group(1));
+                    // Quote the result: a decoded '$' or '\' is not a group reference.
+                    return Matcher.quoteReplacement(new String(Character.toChars(codePoint)));
+                });
+                bufferedWriter.append(line);
+                bufferedWriter.newLine();
+            }
+        }
+    }
+
+    /**
+     * Writes the repertoire element. Each writable code point found by the scan is handed to
+     * buildGroup (GROUPED) or buildChars (FLAT); the scan resumes after the code point returned.
+     *
+     * @param writer destination of the XML events
+     * @param attributeResolver source of the property values
+     * @param ucdVersion UCD version being written
+     * @param lowCodePoint first code point to consider
+     * @param highCodePoint last code point to consider (inclusive)
+     * @param outputRange selects which code points are writable
+     * @param outputType flat or grouped output
+     * @throws SAXException if the writer fails
+     */
+    private static void buildRepertoire(
+            UCDXMLWriter writer,
+            AttributeResolver attributeResolver,
+            VersionInfo ucdVersion,
+            int lowCodePoint,
+            int highCodePoint,
+            UCDXMLOUTPUTRANGE outputRange,
+            UCDXMLOUTPUTTYPE outputType)
+            throws SAXException {
+        final boolean grouped = outputType == UCDXMLOUTPUTTYPE.GROUPED;
+        writer.startElement("repertoire");
+        int next = lowCodePoint;
+        while (next <= highCodePoint) {
+            if (isWritableCodePoint(next, outputRange, attributeResolver)) {
+                if (grouped) {
+                    next = buildGroup(
+                            writer, attributeResolver, ucdVersion, next, highCodePoint,
+                            outputRange, outputType);
+                } else {
+                    next = buildChars(
+                            writer, attributeResolver, ucdVersion, next, highCodePoint,
+                            outputRange, outputType, null);
+                }
+            }
+            next++;
+        }
+        writer.endElement("repertoire");
+    }
+
+    /**
+     * Writes one group element starting at lowCodePoint. The group ends where
+     * getLastCodePointInGroup says; its attributes come from getGroupAttributes and its content
+     * from buildChars.
+     *
+     * @return the last code point covered by the group
+     * @throws SAXException if the writer fails
+     */
+    private static int buildGroup(
+            UCDXMLWriter writer,
+            AttributeResolver attributeResolver,
+            VersionInfo ucdVersion,
+            int lowCodePoint,
+            int highCodePoint,
+            UCDXMLOUTPUTRANGE outputRange,
+            UCDXMLOUTPUTTYPE outputType)
+            throws SAXException {
+        int groupEnd = getLastCodePointInGroup(attributeResolver, lowCodePoint, highCodePoint);
+        AttributesImpl groupAttrs =
+                getGroupAttributes(
+                        ucdVersion, attributeResolver, lowCodePoint, groupEnd, outputRange);
+
+        writer.startElement("group", groupAttrs);
+        // buildChars returns the upper bound it was given, so its result is not needed here.
+        buildChars(
+                writer,
+                attributeResolver,
+                ucdVersion,
+                lowCodePoint,
+                groupEnd,
+                outputRange,
+                outputType,
+                groupAttrs);
+        writer.endElement("group");
+        return groupEnd;
+    }
+
+    /**
+     * Writes the code points from lowCodePoint to highCodePoint (inclusive). Runs of code points
+     * that are unassigned (or, for NOUNIHAN, unified ideographs) are written as range elements; a
+     * run is cut when its range type changes or isDifferentRange reports a difference from the
+     * previous code point. Other code points are written as char elements when they are writable
+     * for outputRange. No range elements are written for UNIHAN.
+     *
+     * @param groupAttrs attributes of the enclosing group; null when called for flat output
+     * @return highCodePoint
+     */
+    private static int buildChars(
+            UCDXMLWriter writer,
+            AttributeResolver attributeResolver,
+            VersionInfo ucdVersion,
+            int lowCodePoint,
+            int highCodePoint,
+            UCDXMLOUTPUTRANGE outputRange,
+            UCDXMLOUTPUTTYPE outputType,
+            AttributesImpl groupAttrs)
+            throws SAXException {
+        ArrayList<Integer> range = new ArrayList<>();
+        Range rangeType = Range.NONRANGE;
+        for (int CodePoint = lowCodePoint; CodePoint <= highCodePoint; CodePoint++) {
+            boolean belongsToRange =
+                    attributeResolver.isUnassignedCodePoint(CodePoint)
+                            || (outputRange == UCDXMLOUTPUTRANGE.NOUNIHAN
+                                    && attributeResolver.isUnifiedIdeograph(CodePoint));
+            if (belongsToRange) {
+                Range currentRangeType = getRangeType(attributeResolver, CodePoint);
+                // Cut the pending run when this code point cannot be merged into it.
+                if (!range.isEmpty()
+                        && (!currentRangeType.equals(rangeType)
+                                || attributeResolver.isDifferentRange(
+                                        ucdVersion, CodePoint, CodePoint - 1))) {
+                    writePendingRange(
+                            writer, attributeResolver, ucdVersion, range, rangeType,
+                            outputRange, outputType, groupAttrs);
+                    range.clear();
+                }
+                range.add(CodePoint);
+                rangeType = currentRangeType;
+                continue;
+            }
+            // Any other code point ends the pending run.
+            if (!range.isEmpty()) {
+                writePendingRange(
+                        writer, attributeResolver, ucdVersion, range, rangeType,
+                        outputRange, outputType, groupAttrs);
+                range.clear();
+                rangeType = Range.NONRANGE;
+            }
+            if (isWritableCodePoint(CodePoint, outputRange, attributeResolver)) {
+                if (outputType == UCDXMLOUTPUTTYPE.GROUPED) {
+                    buildGroupedChar(
+                            writer, attributeResolver, ucdVersion, CodePoint, outputRange,
+                            groupAttrs);
+                } else {
+                    buildUngroupedChar(
+                            writer, attributeResolver, ucdVersion, CodePoint, outputRange);
+                }
+            }
+        }
+        // Handle any range before the end of the repertoire element.
+        writePendingRange(
+                writer, attributeResolver, ucdVersion, range, rangeType,
+                outputRange, outputType, groupAttrs);
+        return highCodePoint;
+    }
+
+    /** Writes the collected run as one range element; no-op if it is empty or for UNIHAN. */
+    private static void writePendingRange(
+            UCDXMLWriter writer,
+            AttributeResolver attributeResolver,
+            VersionInfo ucdVersion,
+            ArrayList<Integer> range,
+            Range rangeType,
+            UCDXMLOUTPUTRANGE outputRange,
+            UCDXMLOUTPUTTYPE outputType,
+            AttributesImpl groupAttrs)
+            throws SAXException {
+        if (range.isEmpty() || outputRange == UCDXMLOUTPUTRANGE.UNIHAN) {
+            return;
+        }
+        if (outputType == UCDXMLOUTPUTTYPE.GROUPED) {
+            buildGroupedRange(writer, attributeResolver, ucdVersion, range, rangeType, groupAttrs);
+        } else {
+            buildUngroupedRange(writer, attributeResolver, ucdVersion, range, rangeType);
+        }
+    }
+
+    /** Writes the char element for CodePoint with the full attribute set from getAttributes. */
+    private static void buildUngroupedChar(
+            UCDXMLWriter writer,
+            AttributeResolver attributeResolver,
+            VersionInfo ucdVersion,
+            int CodePoint,
+            UCDXMLOUTPUTRANGE outputRange)
+            throws SAXException {
+        buildChar(
+                writer, attributeResolver, CodePoint,
+                getAttributes(ucdVersion, attributeResolver, CodePoint, outputRange));
+    }
+
+    /**
+     * Writes the char element for CodePoint inside a group. Besides cp, only the attributes whose
+     * value differs from the group's value are written; an attribute the group has but the code
+     * point lacks is written with an empty value.
+     */
+    private static void buildGroupedChar(
+            UCDXMLWriter writer,
+            AttributeResolver attributeResolver,
+            VersionInfo ucdVersion,
+            int CodePoint,
+            UCDXMLOUTPUTRANGE outputRange,
+            AttributesImpl groupAttrs)
+            throws SAXException {
+        AttributesImpl fullAttributes =
+                getAttributes(ucdVersion, attributeResolver, CodePoint, outputRange);
+        AttributesImpl charAttributes = new AttributesImpl();
+        charAttributes.addAttribute(
+                NAMESPACE, "cp", "cp", "CDATA", attributeResolver.getHexString(CodePoint));
+
+        for (UCDPropertyDetail propDetail : UCDPropertyDetail.ucdxmlValues()) {
+            String shortName = propDetail.getUcdProperty().getShortName();
+            // Names starting with "cjk" are looked up without their first two characters.
+            String qName = shortName.startsWith("cjk") ? shortName.substring(2) : shortName;
+            String ownValue = fullAttributes.getValue(qName);
+            if (Objects.equals(ownValue, groupAttrs.getValue(qName))) {
+                continue;
+            }
+            String written = Objects.requireNonNullElse(ownValue, "");
+            charAttributes.addAttribute(NAMESPACE, qName, qName, "CDATA", written);
+        }
+
+        buildChar(writer, attributeResolver, CodePoint, charAttributes);
+    }
+
+    /**
+     * Writes a char element with the given attributes. Each name alias of CodePoint becomes an
+     * empty name-alias child; its type attribute is omitted when the type is "none".
+     */
+    private static void buildChar(
+            UCDXMLWriter writer,
+            AttributeResolver attributeResolver,
+            int CodePoint,
+            AttributesImpl charAttributes)
+            throws SAXException {
+        writer.startElement("char", charAttributes);
+        HashMap<String, String> nameAliases = attributeResolver.getNameAliases(CodePoint);
+        if (nameAliases != null) {
+            for (Map.Entry<String, String> nameAlias : nameAliases.entrySet()) {
+                AttributesImpl aliasAttributes = new AttributesImpl();
+                aliasAttributes.addAttribute(
+                        NAMESPACE, "alias", "alias", "CDATA", nameAlias.getKey());
+                String type = nameAlias.getValue();
+                if (!"none".equals(type)) {
+                    aliasAttributes.addAttribute(NAMESPACE, "type", "type", "CDATA", type);
+                }
+                writer.startElement("name-alias", aliasAttributes);
+                writer.endElement("name-alias");
+            }
+        }
+        writer.endElement("char");
+    }
+
+    /**
+     * Writes a range element (named by rangeType.tag) inside a group. A single code point gets a
+     * cp attribute, a longer run first-cp and last-cp; the other attributes are those from
+     * getReservedAttributes whose value differs from the group's value.
+     *
+     * @param range the code points of the run; must not be empty
+     * @param rangeType supplies the element name
+     * @param groupAttrs attributes of the enclosing group
+     * @throws SAXException if the writer fails
+     */
+    private static void buildGroupedRange(
+            UCDXMLWriter writer,
+            AttributeResolver attributeResolver,
+            VersionInfo ucdVersion,
+            ArrayList<Integer> range,
+            Range rangeType,
+            AttributesImpl groupAttrs)
+            throws SAXException {
+        AttributesImpl fullAttributes = getReservedAttributes(ucdVersion, attributeResolver, range);
+        AttributesImpl rangeAttributes = new AttributesImpl();
+
+        // Position: cp for a single code point, first-cp/last-cp for a longer run.
+        String firstHex = attributeResolver.getHexString(range.get(0));
+        if (range.size() > 1) {
+            rangeAttributes.addAttribute(NAMESPACE, "first-cp", "first-cp", "CDATA", firstHex);
+            rangeAttributes.addAttribute(
+                    NAMESPACE,
+                    "last-cp",
+                    "last-cp",
+                    "CDATA",
+                    attributeResolver.getHexString(range.get(range.size() - 1)));
+        } else {
+            rangeAttributes.addAttribute(NAMESPACE, "cp", "cp", "CDATA", firstHex);
+        }
+
+        // Remaining attributes: only those that differ from the group.
+        for (UCDPropertyDetail propDetail : UCDPropertyDetail.ucdxmlValues()) {
+            String shortName = propDetail.getUcdProperty().getShortName();
+            // Names starting with "cjk" are looked up without their first two characters.
+            String qName = shortName.startsWith("cjk") ? shortName.substring(2) : shortName;
+            String ownValue = fullAttributes.getValue(qName);
+            if (Objects.equals(ownValue, groupAttrs.getValue(qName))) {
+                continue;
+            }
+            String written = Objects.requireNonNullElse(ownValue, "");
+            rangeAttributes.addAttribute(NAMESPACE, qName, qName, "CDATA", written);
+        }
+        writer.startElement(rangeType.tag, rangeAttributes);
+        writer.endElement(rangeType.tag);
+    }
+
+    /** Writes a range element named by rangeType.tag with the getReservedAttributes values. */
+    private static void buildUngroupedRange(
+            UCDXMLWriter writer,
+            AttributeResolver attributeResolver,
+            VersionInfo ucdVersion,
+            ArrayList<Integer> range,
+            Range rangeType)
+            throws SAXException {
+        AttributesImpl rangeAttributes =
+                getReservedAttributes(ucdVersion, attributeResolver, range);
+        String elementName = rangeType.tag;
+        writer.startElement(elementName, rangeAttributes);
+        writer.endElement(elementName);
+    }
+
+    private static boolean isWritableCodePoint( // is CodePoint written to an outputRange file?
+            int CodePoint, UCDXMLOUTPUTRANGE outputRange, AttributeResolver attributeResolver) {
+        boolean unihanOnly = outputRange == UCDXMLOUTPUTRANGE.UNIHAN;
+        boolean withoutUnihan = outputRange == UCDXMLOUTPUTRANGE.NOUNIHAN;
+        return outputRange == UCDXMLOUTPUTRANGE.ALL
+                || (unihanOnly && attributeResolver.isUnihanAttributeRange(CodePoint))
+                || (withoutUnihan && !attributeResolver.isUnifiedIdeograph(CodePoint));
+    }
+
+    /**
+     * Classifies CodePoint for range output. Checks are made in priority order: Unihan attribute
+     * range, surrogate, private use, noncharacter; anything else is reserved.
+     */
+    private static Range getRangeType(AttributeResolver attributeResolver, int CodePoint) {
+        String nonCharacterValue = attributeResolver.getNChar(CodePoint);
+        UcdPropertyValues.General_Category_Values category = attributeResolver.getgc(CodePoint);
+        if (attributeResolver.isUnihanAttributeRange(CodePoint)) {
+            return Range.CJKUNIFIEDIDEOGRAPH;
+        } else if (category.equals(UcdPropertyValues.General_Category_Values.Surrogate)) {
+            return Range.SURROGATE;
+        } else if (category.equals(UcdPropertyValues.General_Category_Values.Private_Use)) {
+            return Range.CHARACTER;
+        } else if (nonCharacterValue.equals(UcdPropertyValues.Binary.Yes.getShortName())) {
+            return Range.NONCHARACTER;
+        }
+        return Range.RESERVED;
+    }
+
+    private static int getLastCodePointInGroup( // last code point of the group starting at low
+            AttributeResolver attributeResolver, int lowCodePoint, int highCodePoint) {
+        String block = attributeResolver.getAttributeValue(UcdProperty.Block, lowCodePoint);
+        for (int candidate = lowCodePoint; candidate <= highCodePoint; candidate++) {
+            if (!block.equals(attributeResolver.getAttributeValue(UcdProperty.Block, candidate))) {
+                return candidate - 1;
+            }
+            switch (candidate + 1) { // a group also ends just before each of these code points
+                case 0x20: // put the C0 controls in their own group
+                case 0xa0: // put the C1 controls in their own group
+                case 0x1160: // split the jamos into three groups
+                case 0x11a8: // split the jamos into three groups
+                case 0x1f1e6: // put the regional indicators in their own group
+                    return candidate;
+            }
+        }
+        return highCodePoint;
+    }
+
+    /**
+     * Builds the attributes of a char element: cp, then each UCDXML property valid for version
+     * (minimum inclusive, maximum exclusive) that getIsAttributeIncluded accepts.
+     */
+    private static AttributesImpl getAttributes(
+            VersionInfo version,
+            AttributeResolver attributeResolver,
+            int CodePoint,
+            UCDXMLOUTPUTRANGE outputRange) {
+        AttributesImpl attributes = new AttributesImpl();
+        attributes.addAttribute(
+                NAMESPACE, "cp", "cp", "CDATA", attributeResolver.getHexString(CodePoint));
+        for (UCDPropertyDetail propDetail : UCDPropertyDetail.ucdxmlValues()) {
+            UcdProperty prop = propDetail.getUcdProperty();
+            boolean validForVersion =
+                    version.compareTo(propDetail.getMinVersion()) >= 0
+                            && (propDetail.getMaxVersion() == null
+                                    || version.compareTo(propDetail.getMaxVersion()) < 0);
+            if (!validForVersion) {
+                continue;
+            }
+            String attrValue = attributeResolver.getAttributeValue(prop, CodePoint);
+            boolean unihanRange = attributeResolver.isUnihanAttributeRange(CodePoint);
+            if (!getIsAttributeIncluded(attrValue, unihanRange, propDetail, prop, outputRange)) {
+                continue;
+            }
+            String shortName = prop.getShortName();
+            String propName =
+                    shortName.startsWith("cjk") ? prop.getNames().getAllNames().get(1) : shortName;
+            attributes.addAttribute(NAMESPACE, propName, propName, "CDATA", attrValue);
+        }
+        return attributes;
+    }
+
+    /**
+     * Builds the attributes of a group element. For each UCDXML property valid for version, the
+     * value held by the most assigned code points of the group is the candidate (first seen wins
+     * ties; decomposition, case mapping and case folding candidates are replaced by "#"). It is
+     * added when it occurs more than once and on more than 20% of the assigned code points, and
+     * getIsAttributeIncluded accepts it.
+     */
+    private static AttributesImpl getGroupAttributes(
+            VersionInfo version,
+            AttributeResolver attributeResolver,
+            int lowCodePoint,
+            int highCodePoint,
+            UCDXMLOUTPUTRANGE outputRange) {
+        AttributesImpl attributes = new AttributesImpl();
+        for (UCDPropertyDetail propDetail : UCDPropertyDetail.ucdxmlValues()) {
+            UcdProperty prop = propDetail.getUcdProperty();
+            boolean validForVersion =
+                    version.compareTo(propDetail.getMinVersion()) >= 0
+                            && (propDetail.getMaxVersion() == null
+                                    || version.compareTo(propDetail.getMaxVersion()) < 0);
+            if (!validForVersion) {
+                continue;
+            }
+            // Tally the values of the assigned code points, remembering first-seen order.
+            int totalCount = 0;
+            Map<String, Integer> counters = new LinkedHashMap<>();
+            for (int CodePoint = lowCodePoint; CodePoint <= highCodePoint; CodePoint++) {
+                if (attributeResolver.isUnassignedCodePoint(CodePoint)) {
+                    continue;
+                }
+                String attrValue = attributeResolver.getAttributeValue(prop, CodePoint);
+                counters.put(attrValue, counters.getOrDefault(attrValue, 0) + 1);
+                totalCount++;
+            }
+            int max = Integer.MIN_VALUE;
+            String bestAttrValue = null;
+            for (Map.Entry<String, Integer> counter : counters.entrySet()) {
+                if (counter.getValue() > max) {
+                    max = counter.getValue();
+                    bestAttrValue = counter.getKey();
+                }
+            }
+            switch (prop) {
+                case Decomposition_Mapping:
+                case Simple_Uppercase_Mapping:
+                case Simple_Lowercase_Mapping:
+                case Simple_Titlecase_Mapping:
+                case Uppercase_Mapping:
+                case Lowercase_Mapping:
+                case Titlecase_Mapping:
+                case Simple_Case_Folding:
+                case Case_Folding:
+                    if (bestAttrValue != null) {
+                        bestAttrValue = "#";
+                    }
+            }
+            if (max <= 0.2 * totalCount || max <= 1) {
+                continue;
+            }
+            boolean inUnihan = attributeResolver.isUnihanAttributeRange(lowCodePoint);
+            if (!getIsAttributeIncluded(bestAttrValue, inUnihan, propDetail, prop, outputRange)) {
+                continue;
+            }
+            String shortName = prop.getShortName();
+            String propName =
+                    shortName.startsWith("cjk") ? prop.getNames().getAllNames().get(1) : shortName;
+            attributes.addAttribute(NAMESPACE, propName, propName, "CDATA", bestAttrValue);
+        }
+        return attributes;
+    }
+
+    private static boolean getIsAttributeIncluded(
+            String attrValue,
+            boolean isUnihanAttributeRange,
+            UCDPropertyDetail propDetail,
+            UcdProperty prop,
+            UCDXMLOUTPUTRANGE outputRange) {
+        if (attrValue == null) {
+            return false;
+        }
+        if (isUnihanAttributeRange) {
+            if (outputRange == UCDXMLOUTPUTRANGE.UNIHAN) {
+                if (prop.equals(UcdProperty.Numeric_Type) && !attrValue.equals("None")) {
+                    return true;
+                }
+                if (prop.equals(UcdProperty.Numeric_Value) && !attrValue.equals("NaN")) {
+                    return true;
+                }
+                return propDetail.isCJKAttribute()
+                        && (propDetail.isCJKShowIfEmpty() || !attrValue.isEmpty());
+            }
+            if (outputRange == UCDXMLOUTPUTRANGE.NOUNIHAN && propDetail.isCJKAttribute()) {
+                return false;
+            }
+            if (propDetail.isCJKShowIfEmpty()) {
+                return true;
+            }
+        }
+        if (propDetail.isBaseAttribute()) {
+            return true;
+        }
+        return !attrValue.isEmpty();
+    }
+
+    private static AttributesImpl getReservedAttributes(
+            VersionInfo version, AttributeResolver attributeResolver, ArrayList<Integer> range) {
+        AttributesImpl attributes = new AttributesImpl();
+
+        if (range.size() == 1) {
+            attributes.addAttribute(
+                    NAMESPACE, "cp", "cp", "CDATA", attributeResolver.getHexString(range.get(0)));
+        } else {
+            attributes.addAttribute(
+                    NAMESPACE,
+                    "first-cp",
+                    "first-cp",
+                    "CDATA",
+                    attributeResolver.getHexString(range.get(0)));
+            attributes.addAttribute(
+                    NAMESPACE,
+                    "last-cp",
+                    "last-cp",
+                    "CDATA",
+                    attributeResolver.getHexString(range.get(range.size() - 1)));
+        }
+        for (UCDPropertyDetail propDetail : UCDPropertyDetail.baseValues()) {
+            UcdProperty prop = propDetail.getUcdProperty();
+            if (version.compareTo(propDetail.getMinVersion()) >= 0
+                    && (propDetail.getMaxVersion() == null
+                            || version.compareTo(propDetail.getMaxVersion()) <= 0)) {
+                String attrValue =
+                        attributeResolver.getAttributeValue(
+                                propDetail.getUcdProperty(), range.get(0));
+
+                attributes.addAttribute(
+                        NAMESPACE, prop.getShortName(), prop.getShortName(), "CDATA", attrValue);
+            }
+        }
+        return attributes;
+    }
+}
diff --git a/unicodetools/src/main/java/org/unicode/xml/UCDXMLWriter.java b/unicodetools/src/main/java/org/unicode/xml/UCDXMLWriter.java
new file mode 100644
index 000000000..7358ed26f
--- /dev/null
+++ b/unicodetools/src/main/java/org/unicode/xml/UCDXMLWriter.java
@@ -0,0 +1,77 @@
+package org.unicode.xml;
+
+import java.io.FileOutputStream;
+import java.text.SimpleDateFormat;
+import java.util.Date;
+import javax.xml.transform.OutputKeys;
+import javax.xml.transform.Transformer;
+import javax.xml.transform.TransformerConfigurationException;
+import javax.xml.transform.TransformerFactory;
+import javax.xml.transform.sax.SAXTransformerFactory;
+import javax.xml.transform.sax.TransformerHandler;
+import javax.xml.transform.stream.StreamResult;
+import org.xml.sax.SAXException;
+import org.xml.sax.helpers.AttributesImpl;
+
+/** Writes UCDXML content as indented UTF-8 XML through a SAX {@link TransformerHandler}. */
+public class UCDXMLWriter {
+
+    public static final String NAMESPACE = "http://www.unicode.org/ns/2003/ucd/1.0";
+
+    private final TransformerHandler transformerHandler;
+
+    /** Creates the handler and configures its serializer to write to {@code f}. */
+    public UCDXMLWriter(FileOutputStream f) throws TransformerConfigurationException {
+        transformerHandler =
+                ((SAXTransformerFactory) TransformerFactory.newInstance()).newTransformerHandler();
+        final Transformer serializer = transformerHandler.getTransformer();
+        serializer.setOutputProperty(OutputKeys.ENCODING, "utf-8");
+        serializer.setOutputProperty(OutputKeys.METHOD, "xml");
+        serializer.setOutputProperty(OutputKeys.INDENT, "yes");
+        serializer.setOutputProperty(OutputKeys.STANDALONE, "yes");
+        // The indent amount is set under both the xslt and the xalan property names.
+        serializer.setOutputProperty("{http://xml.apache.org/xslt}indent-amount", "3");
+        serializer.setOutputProperty("{http://xml.apache.org/xalan}indent-amount", "3");
+        transformerHandler.setResult(new StreamResult(f));
+    }
+
+    public TransformerHandler getTransformerHandler() {
+        return transformerHandler;
+    }
+
+    /** Starts the document and emits the copyright and terms-of-use comments. */
+    public void startFile() throws SAXException {
+        final String copyrightYear = new SimpleDateFormat("yyyy").format(new Date());
+        transformerHandler.startDocument();
+        writeComment("\n", " \u00A9 " + copyrightYear + " Unicode\u00AE, Inc. ");
+        writeComment("\n", " For terms of use, see http://www.unicode.org/terms_of_use.html ");
+        final char[] tail = "\n\n\n".toCharArray();
+        transformerHandler.characters(tail, 0, tail.length);
+    }
+
+    public void endFile() throws SAXException {
+        transformerHandler.endDocument();
+    }
+
+    public void startElement(String tagName) throws SAXException {
+        startElement(tagName, new AttributesImpl());
+    }
+
+    public void startElement(String tagName, AttributesImpl attributes) throws SAXException {
+        transformerHandler.startElement(NAMESPACE, tagName, tagName, attributes);
+    }
+
+    public void addContent(String s) throws SAXException {
+        transformerHandler.characters(s.toCharArray(), 0, s.length());
+    }
+
+    public void endElement(String tagName) throws SAXException {
+        transformerHandler.endElement(NAMESPACE, tagName, tagName);
+    }
+
+    /** Emits {@code lead} as character data, then {@code text} as an XML comment. */
+    private void writeComment(String lead, String text) throws SAXException {
+        transformerHandler.characters(lead.toCharArray(), 0, lead.length());
+        transformerHandler.comment(text.toCharArray(), 0, text.length());
+    }
+}
diff --git a/unicodetools/src/main/java/org/unicode/xml/XMLProperties.java b/unicodetools/src/main/java/org/unicode/xml/XMLProperties.java
new file mode 100644
index 000000000..d1f6e178e
--- /dev/null
+++ b/unicodetools/src/main/java/org/unicode/xml/XMLProperties.java
@@ -0,0 +1,491 @@
+package org.unicode.xml;
+
+import com.ibm.icu.impl.UnicodeMap;
+import java.io.File;
+import java.io.FileInputStream;
+import java.io.IOException;
+import java.util.ArrayList;
+import java.util.EnumMap;
+import java.util.HashMap;
+import java.util.LinkedHashSet;
+import java.util.List;
+import java.util.Map;
+import java.util.Set;
+import org.unicode.cldr.util.XMLFileReader;
+import org.unicode.props.IndexUnicodeProperties;
+import org.unicode.props.UcdProperty;
+import org.unicode.text.utility.Utility;
+import org.xml.sax.*;
+
+/**
+ * Helper class for org.unicode.xml.CompareUCDXML. Facilitates traversal of the contents of a UCDXML
+ * file.
+ */
+public class XMLProperties {
+
+    /** Element names of a UCDXML file, as upper-case constants with '-' written as '_'. */
+    enum XmlLeaf {
+        BLOCK,
+        BLOCKS,
+        CHAR,
+        CJK_RADICAL,
+        CJK_RADICALS,
+        DESCRIPTION,
+        DO_NOT_EMIT,
+        EMOJI_SOURCE,
+        EMOJI_SOURCES,
+        GROUP,
+        INSTEAD,
+        NAME_ALIAS,
+        NAMED_SEQUENCE,
+        NAMED_SEQUENCES,
+        NONCHARACTER,
+        NORMALIZATION_CORRECTION,
+        NORMALIZATION_CORRECTIONS,
+        PROVISIONAL_NAMED_SEQUENCES,
+        REPERTOIRE,
+        RESERVED,
+        STANDARDIZED_VARIANT,
+        STANDARDIZED_VARIANTS,
+        SURROGATE,
+        UCD;
+        static final XmlLeaf GREATEST_LEAF = NAME_ALIAS;
+        static final XmlLeaf GREATEST_BOTH = CHAR;
+        /** Locale-independent lookup of an element name such as name-alias; null if unknown. */
+        static XmlLeaf forString(String source) {
+            try {
+                return XmlLeaf.valueOf(source.toUpperCase(java.util.Locale.ROOT).replace('-', '_'));
+            } catch (final IllegalArgumentException | NullPointerException ignored) {
+                return null;
+            }
+        }
+    }
+
+    static class IntRange { // mutable code point range; start == end for a single code point
+        int start;
+        int end;
+    }
+
+    /** Values read from the file, one map per property; every UcdProperty has an entry. */
+    Map<UcdProperty, UnicodeMap<String>> property2data = new EnumMap<>(UcdProperty.class);
+
+    {
+        for (final UcdProperty property : UcdProperty.values()) {
+            property2data.put(property, new UnicodeMap<String>());
+        }
+    }
+
+    Set<String> leavesNotHandled = new LinkedHashSet<>(); // names hitting startElement's default
+
+    /** Reads {@code ucdxmlFile} via {@link #readFile} and then freezes every property map. */
+    public XMLProperties(File ucdxmlFile) {
+        readFile(ucdxmlFile);
+
+        for (final UnicodeMap<String> data : property2data.values()) {
+            data.freeze();
+        }
+    }
+
+    /** Parses {@code ucdxmlFile} into the property maps; I/O and SAX errors go to stdout only. */
+    public void readFile(File ucdxmlFile) {
+        System.out.println("Reading: " + ucdxmlFile.toString());
+        // try-with-resources closes the stream even when parse() throws.
+        try (FileInputStream fis = new FileInputStream(ucdxmlFile)) {
+            final XMLReader xmlReader = XMLFileReader.createXMLReader(false);
+            xmlReader.setErrorHandler(new MyErrorHandler());
+            xmlReader.setContentHandler(new MyContentHandler());
+            final InputSource is = new InputSource(fis);
+            is.setSystemId(ucdxmlFile.toString());
+            xmlReader.parse(is);
+        } catch (final IOException | SAXException e) {
+            System.out.println("\t" + "Can't read " + ucdxmlFile);
+            System.out.println("\t" + e.getClass() + "\t" + e.getMessage());
+        }
+    }
+
+    class MyContentHandler implements ContentHandler {
+        IntRange cp = new IntRange(); // range of the element being processed, set by parseCp
+        HashMap<String, String> attributes = new HashMap<>(); // group + element attributes
+        HashMap<String, String> groupAttributes = new HashMap<>(); // from the latest group
+        private final List<XmlLeaf> lastElements = new ArrayList<>(); // stack of open elements
+
+        public MyContentHandler() {}
+
+        @Override
+        public void characters(char[] arg0, int arg1, int arg2) throws SAXException {
+            // Only a description element may carry text; other non-blank content is rejected.
+            final boolean blank = new String(arg0, arg1, arg2).trim().isEmpty();
+            if (!blank && lastElements.get(lastElements.size() - 1) != XmlLeaf.DESCRIPTION) {
+                throw new IllegalArgumentException("Should have no element content");
+            }
+        }
+
+        /**
+         * Pops the most recently opened element from the element stack.
+         *
+         * <p>If the stack is already empty, the unbalanced end tag is reported on stdout and
+         * otherwise ignored. The emptiness check makes the removal safe, so no exception
+         * handling is needed around it.
+         *
+         * @param arg0 namespace URI (only used in the diagnostic message)
+         * @param arg1 local name (only used in the diagnostic message)
+         * @param arg2 qualified name (only used in the diagnostic message)
+         */
+        @Override
+        public void endElement(String arg0, String arg1, String arg2) throws SAXException {
+            if (lastElements.isEmpty()) {
+                System.out.println(
+                        "endElement: can't remove last element. Args: "
+                                + arg0
+                                + ", "
+                                + arg1
+                                + ", "
+                                + arg2);
+                return;
+            }
+            lastElements.remove(lastElements.size() - 1);
+        }
+
+        @Override // no-op: this SAX event is ignored
+        public void endDocument() throws SAXException {}
+
+        @Override // no-op: this SAX event is ignored
+        public void endPrefixMapping(String arg0) throws SAXException {}
+
+        @Override // no-op: this SAX event is ignored
+        public void ignorableWhitespace(char[] arg0, int arg1, int arg2) throws SAXException {}
+
+        @Override // no-op: this SAX event is ignored
+        public void processingInstruction(String arg0, String arg1) throws SAXException {}
+
+        @Override // no-op: the locator is not kept
+        public void setDocumentLocator(Locator arg0) {}
+
+        @Override // no-op: this SAX event is ignored
+        public void skippedEntity(String arg0) throws SAXException {}
+
+        @Override // no-op: this SAX event is ignored
+        public void startDocument() throws SAXException {}
+
+        @Override // no-op: this SAX event is ignored
+        public void startPrefixMapping(String arg0, String arg1) throws SAXException {}
+
+        @Override // pushes the element onto lastElements, then stores its data by element type
+        public void startElement(
+                String namespaceURI, String localName, String qName, Attributes atts) {
+            try {
+                final XmlLeaf xmlLeaf = XmlLeaf.forString(qName);
+                if (xmlLeaf == null) { // unknown element: the throw is caught and printed below
+                    throw new IllegalArgumentException(qName);
+                }
+                lastElements.add(xmlLeaf);
+
+                // A group element only records its attributes; following elements start from them.
+                if (xmlLeaf == XmlLeaf.GROUP) {
+                    groupAttributes.clear();
+                    addAttributes(atts, groupAttributes);
+                    return;
+                }
+                attributes.clear();
+                attributes.putAll(groupAttributes); // group values first; own attributes override
+                addAttributes(atts, attributes);
+                String cps;
+                switch (xmlLeaf) {
+                    case CHAR:
+                    case RESERVED:
+                    case SURROGATE:
+                    case NONCHARACTER:
+                        parseCp(attributes);
+                        for (final Map.Entry<String, String> entry : attributes.entrySet()) {
+                            doAttributes(entry.getKey(), entry.getValue());
+                        }
+                        if (xmlLeaf == XmlLeaf.NONCHARACTER) {
+                            property2data
+                                    .get(UcdProperty.Noncharacter_Code_Point)
+                                    .putAll(cp.start, cp.end, "Yes");
+                        }
+                        break;
+                    case BLOCK:
+                        parseCp(attributes);
+                        property2data
+                                .get(UcdProperty.Block)
+                                .putAll(cp.start, cp.end, attributes.get("name"));
+                        break;
+                    case NAMED_SEQUENCE:
+                        cps = Utility.fromHex(attributes.get("cps"));
+                        property2data
+                                .get(UcdProperty.Named_Sequences)
+                                .put(cps, attributes.get("name"));
+                        break;
+                    case CJK_RADICAL:
+                        final String number = attributes.get("number");
+                        setProp(
+                                Utility.fromHex(attributes.get("radical")),
+                                UcdProperty.CJK_Radical,
+                                number);
+                        setProp(
+                                Utility.fromHex(attributes.get("ideograph")),
+                                UcdProperty.CJK_Radical,
+                                number);
+                        break;
+                    case EMOJI_SOURCE:
+                        cps = Utility.fromHex(attributes.get("unicode"));
+                        setProp(cps, UcdProperty.Emoji_DCM, attributes.get("docomo"));
+                        setProp(cps, UcdProperty.Emoji_KDDI, attributes.get("kddi"));
+                        setProp(cps, UcdProperty.Emoji_SB, attributes.get("softbank"));
+                        break;
+                    case REPERTOIRE:
+                    case BLOCKS:
+                    case CJK_RADICALS:
+                    case EMOJI_SOURCES:
+                    case NAMED_SEQUENCES:
+                    case PROVISIONAL_NAMED_SEQUENCES:
+                    case NORMALIZATION_CORRECTIONS:
+                    case STANDARDIZED_VARIANTS:
+                    case DESCRIPTION:
+                    case DO_NOT_EMIT:
+                        // non-informational nodes, skip
+                        if (atts.getLength() != 0) {
+                            throw new IllegalArgumentException("Has attributes");
+                        }
+                        break;
+                    case UCD:
+                        if (atts.getLength() != 0) {
+                            throw new IllegalArgumentException(
+                                    "Has wrong number of attributes: " + attributes.entrySet());
+                        }
+                        break;
+                    case NAME_ALIAS: // attaches to cp.start left by the last parseCp call
+                        final String alias =
+                                attributes.get("alias") + "(" + attributes.get("type") + ")";
+                        appendProp(cp.start, UcdProperty.Name_Alias, alias);
+                        break;
+                    case STANDARDIZED_VARIANT:
+                        {
+                            String desc = attributes.get("desc");
+                            final String when = attributes.get("when");
+                            if (!when.isEmpty()) { // NOTE(review): NPE if "when" is absent
+                                desc = desc + "(" + when + ")";
+                            }
+                            cps = Utility.fromHex(attributes.get("cps"));
+                            appendProp(cps, UcdProperty.Standardized_Variant, desc);
+                            break;
+                        }
+                    case NORMALIZATION_CORRECTION:
+                        final String correction =
+                                "old: "
+                                        + attributes.get("old")
+                                        + " new: "
+                                        + attributes.get("new")
+                                        + " version: "
+                                        + attributes.get("version");
+                        cps = Utility.fromHex(attributes.get("cp"));
+                        appendProp(cps, UcdProperty.NC_Original, correction);
+                        break;
+                    case INSTEAD:
+                        final String instead =
+                                "use: "
+                                        + attributes.get("use")
+                                        + " because: "
+                                        + attributes.get("because");
+                        cps = attributes.get("of"); // raw value, no Utility.fromHex here
+                        appendProp(cps, UcdProperty.Do_Not_Emit_Preferred, instead);
+                        break;
+                    case GROUP:
+                        break; // handled above. Leaving case for clarity
+                    default: // all current XmlLeaf constants are handled above
+                        leavesNotHandled.add(qName);
+                        break;
+                }
+            } catch (final Exception e) { // best effort: report and continue parsing
+                System.out.println(
+                        "Exception: "
+                                + qName
+                                + "\t"
+                                + e.getClass().getName()
+                                + "\t"
+                                + e.getMessage());
+            }
+        }
+
+        public void addAttributes(Attributes atts, Map<String, String> map) {
+            for (int index = 0, count = atts.getLength(); index < count; index++) {
+                map.put(atts.getQName(index), atts.getValue(index)); // keyed by qualified name
+            }
+        }
+
+        public void setProp(String cps, UcdProperty ucdProperty, String docomo) {
+            if (docomo != null) { // store the value for the string cps; null is skipped
+                property2data.get(ucdProperty).put(cps, docomo);
+            }
+        }
+
+        public void setProp(int cps, UcdProperty ucdProperty, String docomo) {
+            if (docomo != null) { // store the value for the code point cps; null is skipped
+                property2data.get(ucdProperty).put(cps, docomo);
+            }
+        }
+
+        public void appendProp(int cps, UcdProperty ucdProperty, String docomo) {
+            final UnicodeMap<String> target = property2data.get(ucdProperty);
+            final String existing = target.get(cps);
+            target.put(cps, existing != null ? existing + "; " + docomo : docomo); // "; "-joined
+        }
+
+        public void appendProp(String cps, UcdProperty ucdProperty, String docomo) {
+            final UnicodeMap<String> target = property2data.get(ucdProperty);
+            final String existing = target.get(cps);
+            target.put(cps, existing != null ? existing + "; " + docomo : docomo); // "; "-joined
+        }
+
+        /** Sets cp from "cp", else from "first-cp" and "last-cp"; all values are hexadecimal. */
+        public void parseCp(HashMap<String, String> attributes2) {
+            final String single = attributes2.get("cp");
+            final boolean isSingle = single != null;
+            final String first = isSingle ? single : attributes2.get("first-cp");
+            final String last = isSingle ? single : attributes2.get("last-cp");
+            cp.start = Integer.parseInt(first, 16);
+            cp.end = Integer.parseInt(last, 16);
+        }
+
+        /**
+         * Stores one attribute value for the current code point range.
+         *
+         * <p>The key is resolved with {@code UcdProperty.forString}; when that fails, the short
+         * names InSC and InMC are mapped explicitly. InMC (Indic_Matra_Category) is the former
+         * name of Indic_Positional_Category and is routed there; it used to be stored in the
+         * Indic_Syllabic_Category map, where it could overwrite the InSC values.
+         *
+         * @return the map that was updated, or null if the key is not a known property
+         */
+        public UnicodeMap<String> doAttributes(String key, String value) {
+            UcdProperty prop = UcdProperty.forString(key);
+            if (prop == null) {
+                if (key.equals("InSC")) {
+                    prop = UcdProperty.Indic_Syllabic_Category;
+                } else if (key.equals("InMC")) {
+                    prop = UcdProperty.Indic_Positional_Category;
+                } else {
+                    return null; // cp, first-cp, last-cp and any other unknown key
+                }
+            }
+            final UnicodeMap<String> data = property2data.get(prop);
+            if (data == null) {
+                System.out.println("can't get data for " + key);
+                return null;
+            }
+            data.putAll(cp.start, cp.end, value.intern());
+            return data;
+        }
+    }
+
+    static class MyErrorHandler implements ErrorHandler {
+        @Override
+        public void error(SAXParseException exception) throws SAXException {
+            // System.out.println("\nerror: " + XMLFileReader.showSAX(exception));
+            throw exception;
+        }
+
+        @Override
+        public void fatalError(SAXParseException exception) throws SAXException {
+            // System.out.println("\nfatalError: " + XMLFileReader.showSAX(exception));
+            throw exception;
+        }
+
+        @Override
+        public void warning(SAXParseException exception) throws SAXException {
+            // System.out.println("\nwarning: " + XMLFileReader.showSAX(exception));
+            throw exception;
+        }
+    }
+
+    public UnicodeMap<String> getMap(UcdProperty prop) { // map for prop; frozen by the constructor
+        return property2data.get(prop);
+    }
+
+    public Set<String> getLeavesNotHandled() { // returns the live set, not a copy
+        return leavesNotHandled;
+    }
+
+    /** Display form: "null", "<empty>", a hex escape if the first code point is < 0x20, else «…». */
+    static String show(String ival) {
+        if (ival == null) {
+            return "null";
+        }
+        if (ival.isEmpty()) {
+            return "<empty>";
+        }
+        return ival.codePointAt(0) < 0x20 ? "\\u{" + Utility.hex(ival, 4) + "}" : "«" + ival + "»";
+    }
+
+    /**
+     * When true, {@link #getXmlResolved} replaces a null Binary property value with "No"; when
+     * false, a null value is left as it is. Currently disabled.
+     */
+    static final boolean HACK_XML_DEFAULTS = false;
+
+    /**
+     * Resolves a raw UCDXML attribute value according to the type of {@code property}. A null
+     * value is returned unchanged unless one of the rules below replaces it.
+     *
+     * <ul>
+     *   <li>Binary, Enumerated, Catalog: a non-null value goes through {@code normalizeValue};
+     *       with {@link #HACK_XML_DEFAULTS} set, a null Binary value becomes "No".
+     *   <li>Numeric: a null or empty kOtherNumeric, kPrimaryNumeric or kAccountingNumeric value
+     *       becomes "NaN"; every other numeric value is returned unchanged.
+     *   <li>Miscellaneous: Script_Extensions is normalized; for any other property each "#" is
+     *       replaced by the hex form of {@code codePoint}.
+     *   <li>String: "#" is replaced as above and the result is converted with {@code
+     *       Utility.fromHex}.
+     * </ul>
+     *
+     * @param property the property the value belongs to; its type selects the rule
+     * @param codePoint the code point whose hex form is substituted for "#"
+     * @param propertyValue the raw value, may be null
+     * @return the resolved value, possibly null
+     */
+    public static String getXmlResolved(UcdProperty property, int codePoint, String propertyValue) {
+        switch (property.getType()) {
+            case Binary:
+                if (HACK_XML_DEFAULTS && propertyValue == null) {
+                    return "No";
+                }
+                // $FALL-THROUGH$
+            case Enumerated:
+            case Catalog:
+                if (propertyValue != null) {
+                    return IndexUnicodeProperties.normalizeValue(property, propertyValue);
+                }
+                break;
+            case Numeric:
+                switch (property) {
+                    case kOtherNumeric:
+                    case kPrimaryNumeric:
+                    case kAccountingNumeric:
+                        if (propertyValue == null || propertyValue.isEmpty()) {
+                            return "NaN";
+                        }
+                        break;
+                    default:
+                        break;
+                }
+                break;
+            case Miscellaneous:
+                if (propertyValue == null) {
+                    break;
+                }
+                if (property == UcdProperty.Script_Extensions) {
+                    return IndexUnicodeProperties.normalizeValue(property, propertyValue);
+                }
+                return propertyValue.replace("#", Utility.hex(codePoint));
+            case String:
+                if (propertyValue != null) {
+                    return Utility.fromHex(propertyValue.replace("#", Utility.hex(codePoint)));
+                }
+                break;
+            default:
+                break;
+        }
+        return propertyValue;
+    }
+}
diff --git a/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyAliases.txt b/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyAliases.txt
index 7d4ce84e7..0f9cbda3d 100644
--- a/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyAliases.txt
+++ b/unicodetools/src/main/resources/org/unicode/props/ExtraPropertyAliases.txt
@@ -67,6 +67,7 @@ CJKR ; CJK_Radical
 EDCM ; Emoji_DCM
 EKDDI ; Emoji_KDDI
 ESB ; Emoji_SB
+EVS ; emoji_variation_sequence
 NS ; Named_Sequences
 NSP ; Named_Sequences_Prov
 SV ; Standardized_Variant
@@ -160,6 +161,9 @@ cjkJoyoKanji ; kJoyoKanji
 cjkKoreanEducationHanja ; kKoreanEducationHanja
 cjkKoreanName ; kKoreanName
 cjkTGH ; kTGH
+ncCorrected ; NC_Corrected
+ncOriginal ; NC_Original
+ncVersion ; NC_Version
 # 13.0
 cjkSpoofingVariant       ; kSpoofingVariant
 cjkTGHZ2013              ; kTGHZ2013
@@ -187,4 +191,4 @@ kReading                 ; kReading
 
 kEH_Func                 ; kEH_Func
 kEH_FVal                 ; kEH_FVal
-kEH_UniK                 ; kEH_UniK
\ No newline at end of file
+kEH_UniK                 ; kEH_UniK
diff --git a/unicodetools/src/main/resources/org/unicode/props/IndexPropertyRegex.txt b/unicodetools/src/main/resources/org/unicode/props/IndexPropertyRegex.txt
index a9b3e9f12..e280c7ff2 100644
--- a/unicodetools/src/main/resources/org/unicode/props/IndexPropertyRegex.txt
+++ b/unicodetools/src/main/resources/org/unicode/props/IndexPropertyRegex.txt
@@ -44,9 +44,11 @@ $codePoint0 =   ($codePoints)?
 # Main data
 
 Bidi_Mirroring_Glyph ;        SINGLE_VALUED ;               $codePoint
+Bidi_Paired_Bracket ;         SINGLE_VALUED ;               $codePoint
 Simple_Lowercase_Mapping ;    SINGLE_VALUED ;               $codePoint
 Simple_Titlecase_Mapping ;    SINGLE_VALUED ;               $codePoint
 Simple_Uppercase_Mapping ;    SINGLE_VALUED ;               $codePoint
+Equivalent_Unified_Ideograph; SINGLE_VALUED ;               $codePoint
 
 NFKC_Casefold ;               SINGLE_VALUED ;               $codePoint0
 NFKC_Simple_Casefold ;        SINGLE_VALUED ;               $codePoint0
@@ -142,7 +144,7 @@ kHanYu ;                      MULTI_VALUED ;                 [1-8][0-9]{4}\.[0-3
 kIRGHanyuDaZidian ;           SINGLE_VALUED ;                [1-8][0-9]{4}\.[0-3][0-9][01]
 kCNS1992 ;                    SINGLE_VALUED ;                [1-9]-[0-9A-F]{4}
 kTotalStrokes ;               ORDERED ;                      [1-9][0-9]{0,2}
-kRSUnicode ;                  ORDERED ;                 [1-9][0-9]{0,2}\'?\.[0-9]{1,2}
+kRSUnicode ;                  ORDERED ;                      [1-9][0-9]{0,2}\'?\.[0-9]{1,2}
 kRSJapanese ;                 EXTENSIBLE ;                   [1-9][0-9]{0,2}\.[0-9]{1,2}
 kRSKanWa ;                    EXTENSIBLE ;                   [1-9][0-9]{0,2}\.[0-9]{1,2}
 kRSKangXi ;                   EXTENSIBLE ;                   [1-9][0-9]{0,2}\.[0-9]{1,2}
@@ -170,13 +172,13 @@ kHanyuPinlu ;                 MULTI_VALUED ;                 [a-z\x{308}]+[1-5]\
 kCantonese ;                  MULTI_VALUED ;                 [a-z]{1,6}[1-6]
 kTang ;                       MULTI_VALUED ;                 \*?[A-Za-z()\x{E6}\x{251}\x{259}\x{25B}\x{300}\x{30C}]+
 
-kJinmeiyoKanji ; 		      MULTI_VALUED ;                 (20[0-9]{2})(:U\+2?[0-9A-F]{4})?
-kJoyoKanji ; 		          MULTI_VALUED ;                 (20[0-9]{2})|(U\+2?[0-9A-F]{4})
+kJinmeiyoKanji ;              MULTI_VALUED ;                 (20[0-9]{2})(:U\+2?[0-9A-F]{4})?
+kJoyoKanji ;                  MULTI_VALUED ;                 (20[0-9]{2})|(U\+2?[0-9A-F]{4})
 kKoreanEducationHanja ;       MULTI_VALUED ;                 20[0-9]{2}
-kKoreanName ; 		          MULTI_VALUED ;                 (20[0-9]{2})(:U\+2?[0-9A-F]{4})*
-kTGH ; 		                  MULTI_VALUED ;      			 20[0-9]{2}:[1-9][0-9]{0,3}
+kKoreanName ;                 MULTI_VALUED ;                 (20[0-9]{2})(:U\+2?[0-9A-F]{4})*
+kTGH ;                        MULTI_VALUED ;                 20[0-9]{2}:[1-9][0-9]{0,3}
 
-kIRG_UKSource ;                SINGLE_VALUED ;                V[0-4]-[0-9A-F]{4}
+kIRG_UKSource ;               SINGLE_VALUED ;                V[0-4]-[0-9A-F]{4}
 kIRG_SSource ;                SINGLE_VALUED ;                V[0-4]-[0-9A-F]{4}
 
 # Unihan properties from 13.0 and later.  No regexes for now.
@@ -199,28 +201,37 @@ kZhuangNumeric ; MULTI_VALUED ; .*
 kFanqie ; MULTI_VALUED ; .*
 kZhuang ; MULTI_VALUED ; .*
 
+kSrc_NushuDuben ;             SINGLE_VALUED ;                [0-9]+\.[0-9]+
+kReading ;                    SINGLE_VALUED ;                [a-z]{1,6}[1-6]+
+kRSTUnicode ;                 SINGLE_VALUED ;                [0-9]+\.[0-9]+
+kTGT_MergedSrc ;              SINGLE_VALUED ;                L2008-[0-9A-F]{4,5}(-[0-9]{4,5})?
+
+NC_Original ;                 SINGLE_VALUED ;                [0-9A-F]{4,5}
+NC_Corrected ;                SINGLE_VALUED ;                [0-9A-F]{4,5}
+NC_Version ;                  SINGLE_VALUED ;                [0-9]\.[0-9]\.[0-9]
+
 # =============================
 # Catalog/Enum/Binary Properties
 # All not listed are SINGLE_VALUED ; null
 # =============================
 
-Script_Extensions		;	MULTI_VALUED	;				<enum> 
-Standardized_Variant	;	MULTI_VALUED	;				.* 
+Script_Extensions ;           MULTI_VALUED ;                 <enum>
+Standardized_Variant ;        MULTI_VALUED ;                 .*
 
-Idn_Status				;	SINGLE_VALUED	;				<enum>
-Idn_Mapping				;	SINGLE_VALUED	;				$codePoints
-Idn_2008				;	SINGLE_VALUED	;				<enum>
+Idn_Status ;                  SINGLE_VALUED ;                <enum>
+Idn_Mapping ;                 SINGLE_VALUED ;                $codePoints
+Idn_2008 ;                    SINGLE_VALUED ;                <enum>
 
-Identifier_Status		;	SINGLE_VALUED	; 				<enum>
-Identifier_Type			;	MULTI_VALUED	;				<enum>
+Identifier_Status ;           SINGLE_VALUED ;                <enum>
+Identifier_Type ;             MULTI_VALUED ;                 <enum>
 
-Confusable_SL			;	SINGLE_VALUED	;				$codePoints
-Confusable_SA			;	SINGLE_VALUED	;				$codePoints
-Confusable_ML			;	SINGLE_VALUED	;				$codePoints
-Confusable_MA			;	SINGLE_VALUED	;				$codePoints
+Confusable_SL ;               SINGLE_VALUED ;                $codePoints
+Confusable_SA ;               SINGLE_VALUED ;                $codePoints
+Confusable_ML ;               SINGLE_VALUED ;                $codePoints
+Confusable_MA ;               SINGLE_VALUED ;                $codePoints
 
-#Emoji					;	SINGLE_VALUED	;				<enum>
-#Emoji_Presentation		;	SINGLE_VALUED	;				<enum>
-#Emoji_Modifier			;	SINGLE_VALUED	;				<enum>
-#Emoji_Modifier_Base		;	SINGLE_VALUED	;				<enum>
+#Emoji ;                       SINGLE_VALUED ;                <enum>
+#Emoji_Presentation ;          SINGLE_VALUED ;                <enum>
+#Emoji_Modifier ;              SINGLE_VALUED ;                <enum>
+#Emoji_Modifier_Base ;         SINGLE_VALUED ;                <enum>
 
diff --git a/unicodetools/src/main/resources/org/unicode/props/IndexUnicodeProperties.txt b/unicodetools/src/main/resources/org/unicode/props/IndexUnicodeProperties.txt
index f7c9da838..5ff7cbdf5 100644
--- a/unicodetools/src/main/resources/org/unicode/props/IndexUnicodeProperties.txt
+++ b/unicodetools/src/main/resources/org/unicode/props/IndexUnicodeProperties.txt
@@ -36,6 +36,8 @@ FileType ; Unihan_OtherMappings ; PropertyValue
 FileType ; Unihan_RadicalStrokeCounts ; PropertyValue
 FileType ; Unihan_Readings ; PropertyValue
 FileType ; Unihan_Variants ; PropertyValue
+FileType ; NushuSources ; PropertyValue
+FileType ; TangutSources ; PropertyValue
 
 # NameAliases File Type
 # Contains a multivalued property, where successive values are not in the same line, but are divided out on successive lines with the same code point
@@ -43,6 +45,7 @@ FileType ; Unihan_Variants ; PropertyValue
 FileType ; NameAliases ; NameAliases
 FileType ; NameAliasesProv ; NameAliases
 FileType ; StandardizedVariants ; StandardizedVariants
+FileType ; emoji-variation-sequences ; StandardizedVariants
 
 # CJKRadicals File Type
 
@@ -320,6 +323,15 @@ Unihan_Variants ; kSpoofingVariant
 Unihan_Variants ; kTraditionalVariant
 Unihan_Variants ; kZVariant
 
+NushuSources ; kSrc_NushuDuben
+NushuSources ; kReading
+TangutSources ; kRSTUnicode
+TangutSources ; kTGT_MergedSrc
+
+NormalizationCorrections ; NC_Original
+NormalizationCorrections ; NC_Corrected
+NormalizationCorrections ; NC_Version
+
 # Properties removed from Unihan before 5.1.
 # Point to a nonexistent file so that we don’t try to read them from the most recent monolithic
 # Unihan, as we would then get confused by the other (still-extant) properties in that file.
@@ -438,6 +450,7 @@ EmojiSources ; Emoji_SB ; 3
 NamedSequences ; Named_Sequences
 NamedSequencesProv ; Named_Sequences_Prov
 StandardizedVariants ; Standardized_Variant
+emoji-variation-sequences ; emoji-variation-sequence
 DoNotEmit ; Do_Not_Emit_Preferred ; 1
 DoNotEmit ; Do_Not_Emit_Type ; 2
 
@@ -488,15 +501,6 @@ emoji/*/emoji-zwj-sequences; RGI_Emoji_Zwj_Sequence
 
 #emoji/*/emoji-test ; Emoji_Short_Name
 
-
-FileType ; TangutSources ; PropertyValue
-TangutSources ; kTGT_MergedSrc
-TangutSources ; kRSTUnicode
-
-FileType ; NushuSources ; PropertyValue
-NushuSources ; kSrc_NushuDuben
-NushuSources ; kReading
-
 FileType ; Unikemet ; PropertyValue
 Unikemet ; kEH_Cat
 Unikemet ; kEH_Core
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/Bidi_C.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Bidi_C.xml
new file mode 100644
index 000000000..617113bf2
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Bidi_C.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="Bidi_C attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute Bidi_C { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/Bidi_M.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Bidi_M.xml
new file mode 100644
index 000000000..c1380221b
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Bidi_M.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="Bidi_M attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute Bidi_M { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/Emoji.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Emoji.xml
new file mode 100644
index 000000000..7c7873459
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Emoji.xml
@@ -0,0 +1,20 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="Emoji properties" id='schema.emoji-data'>
+  code-point-attributes &amp;=
+    attribute Emoji { boolean }?
+
+  code-point-attributes &amp;=
+    attribute EPres { boolean }?
+
+  code-point-attributes &amp;=
+    attribute EMod { boolean }?
+
+  code-point-attributes &amp;=
+    attribute EBase { boolean }?
+
+  code-point-attributes &amp;=
+    attribute EComp { boolean }?
+
+  code-point-attributes &amp;=
+    attribute ExtPict { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/InCB.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/InCB.xml
new file mode 100644
index 000000000..8340250dc
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/InCB.xml
@@ -0,0 +1,9 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="InCB attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute InCB { "Consonant"
+                   | "Extend"
+                   | "Linker"
+                   | "None"
+                   }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/InPC.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/InPC.xml
new file mode 100644
index 000000000..a7de62387
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/InPC.xml
@@ -0,0 +1,21 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="InPC attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute InPC { "Bottom"
+                   | "Bottom_And_Left"
+                   | "Bottom_And_Right"
+                   | "Left"
+                   | "Left_And_Right"
+                   | "NA"
+                   | "Overstruck"
+                   | "Right"
+                   | "Top"
+                   | "Top_And_Bottom"
+                   | "Top_And_Bottom_And_Left"
+                   | "Top_And_Bottom_And_Right"
+                   | "Top_And_Left"
+                   | "Top_And_Left_And_Right"
+                   | "Top_And_Right"
+                   | "Visual_Order_Left"
+                   }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/InSC.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/InSC.xml
new file mode 100644
index 000000000..ddddc27a4
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/InSC.xml
@@ -0,0 +1,42 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="InSC attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute InSC { "Avagraha"
+                   | "Bindu"
+                   | "Brahmi_Joining_Number"
+                   | "Cantillation_Mark"
+                   | "Consonant"
+                   | "Consonant_Dead"
+                   | "Consonant_Final"
+                   | "Consonant_Head_Letter"
+                   | "Consonant_Initial_Postfixed"
+                   | "Consonant_Killer"
+                   | "Consonant_Medial"
+                   | "Consonant_Placeholder"
+                   | "Consonant_Preceding_Repha"
+                   | "Consonant_Prefixed"
+                   | "Consonant_Subjoined"
+                   | "Consonant_Succeeding_Repha"
+                   | "Consonant_With_Stacker"
+                   | "Gemination_Mark"
+                   | "Invisible_Stacker"
+                   | "Joiner"
+                   | "Modifying_Letter"
+                   | "Non_Joiner"
+                   | "Nukta"
+                   | "Number"
+                   | "Number_Joiner"
+                   | "Other"
+                   | "Pure_Killer"
+                   | "Register_Shifter"
+                   | "Reordering_Killer"
+                   | "Syllable_Modifier"
+                   | "Tone_Letter"
+                   | "Tone_Mark"
+                   | "Virama"
+                   | "Visarga"
+                   | "Vowel"
+                   | "Vowel_Dependent"
+                   | "Vowel_Independent"
+                   }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/JSN.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/JSN.xml
new file mode 100644
index 000000000..568f5e270
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/JSN.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="JSN attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute JSN { xsd:string { pattern="[A-Z]{0,3}" } }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/Join_C.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Join_C.xml
new file mode 100644
index 000000000..4cbf1d0f0
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Join_C.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="joining properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute Join_C { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/Name_Alias.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Name_Alias.xml
new file mode 100644
index 000000000..c2b53b2fe
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Name_Alias.xml
@@ -0,0 +1,10 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="name-alias element" id='schema.properties'>
+  code-point-attributes &amp;=
+    element name-alias {
+      attribute alias { xsd:string { pattern="[a-zA-Z0-9]+(( -|- |[\-_ ])[a-zA-Z0-9]+)*" } }?,
+      attribute type  { "abbreviation" | "alternate"
+                      | "control" | "correction"
+                      | "figment"
+                      }? } *
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/Nushu.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Nushu.xml
new file mode 100644
index 000000000..8919bba32
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Nushu.xml
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="Nushu data" id='schema.nushu'>
+  code-point-attributes &amp;=
+    attribute kSrc_NushuDuben { xsd:string { pattern="[0-9]+\.[0-9]+" } }?
+
+  code-point-attributes &amp;=
+    attribute kReading { xsd:string }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/Set_of_code_points.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Set_of_code_points.xml
new file mode 100644
index 000000000..a6ff2d092
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Set_of_code_points.xml
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="Set of code points" id='schema.repertoire'>
+  set-of-code-points =
+     attribute cp { single-code-point }
+   | ( attribute first-cp { single-code-point },
+       attribute last-cp  { single-code-point } )
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/Tangut.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Tangut.xml
new file mode 100644
index 000000000..21e52208a
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Tangut.xml
@@ -0,0 +1,18 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="Tangut data" id='schema.tangut'>
+  code-point-attributes &amp;=
+    attribute kRSTUnicode { xsd:string { pattern="[0-9]+\.[0-9]+" } }?
+
+  code-point-attributes &amp;=
+    attribute kTGT_MergedSrc
+     { xsd:string {pattern="L2008-[0-9A-F]{4,5}(-[0-9]{4,5})?"}
+     | xsd:string {pattern="L2006-[0-9]{4}"}
+     | xsd:string {pattern="L1997-[0-9]{4}"}
+     | xsd:string {pattern="L1986-[0-9]{4}"}
+     | xsd:string {pattern="S1968-[0-9]{4}"}
+     | xsd:string {pattern="N1966-[0-9]{3}(-[0-9A-Z]{3,4})?"}
+     | xsd:string {pattern="H2004-[A-Z]-[0-9]{4}"}
+     | xsd:string {pattern="L2012-[0-9]{4}"}
+     | xsd:string {pattern="UTN42-[0-9]{3}"}
+     }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/Unihan.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Unihan.xml
new file mode 100644
index 000000000..ba4c042f8
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/Unihan.xml
@@ -0,0 +1,347 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="Unihan properties" id='schema.properties'>
+  code-point-attributes &amp;= attribute kAccountingNumeric
+    { xsd:string { pattern="[0-9]+" } }?
+
+  code-point-attributes &amp;= attribute kAlternateTotalStrokes
+    { list { xsd:string { pattern="(\d+:[BHJKMPSUV]+)|-" }+ } }?
+
+  code-point-attributes &amp;= attribute kBigFive
+    { xsd:string { pattern="[0-9A-F]{4}'?" } }?
+
+  code-point-attributes &amp;= attribute kCangjie
+    { xsd:string { pattern="[A-Z]+" } }?
+
+  code-point-attributes &amp;= attribute kCantonese
+    { list { xsd:string { pattern="[a-z]{1,6}[1-6]" }+ } }?
+
+  code-point-attributes &amp;= attribute kCCCII
+    { list { xsd:string { pattern="[0-9A-F]{6}" }+ } }?
+
+  code-point-attributes &amp;= attribute kCheungBauer
+    { list { xsd:string { pattern="[0-9]{3}/[0-9]{2};[A-Z]*;[a-z1-6\[\]/,]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kCheungBauerIndex
+    { list { xsd:string { pattern="[0-9]{3}\.[01][0-9]" }+ } }?
+
+  code-point-attributes &amp;= attribute kCihaiT
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}\.[0-9]{3}" }+ } }?
+
+  code-point-attributes &amp;= attribute kCNS1986
+    { xsd:string { pattern="[12E]-[0-9A-F]{4}" } }?
+
+  code-point-attributes &amp;= attribute kCNS1992
+    { xsd:string { pattern="[1-9]-[0-9A-F]{4}" } }?
+
+  code-point-attributes &amp;= attribute kCompatibilityVariant
+    { "" | xsd:string { pattern="U\+[23]?[0-9A-F]{4}" } }?
+
+  code-point-attributes &amp;= attribute kCowles
+    { list { xsd:string { pattern="[0-9]{1,4}(\.[0-9]{1,2})?" }+ } }?
+
+  code-point-attributes &amp;= attribute kDaeJaweon
+    { xsd:string { pattern="[0-9]{4}\.[0-9]{2}[01]" } }?
+
+  code-point-attributes &amp;= attribute kDefinition
+    { xsd:string { pattern='[^\t"]+' } }?
+
+  code-point-attributes &amp;= attribute kEACC
+    { xsd:string { pattern="[0-9A-F]{6}" } }?
+
+  code-point-attributes &amp;= attribute kFanqie
+    { list { xsd:string { pattern="[\x{3400}-\x{4DBF}\x{4E00}-\x{9FFF}\x{20000}-\x{2A6DF}]{2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kFenn
+    { list { xsd:string { pattern="[0-9]+a?[A-KP*]" }+ } }?
+
+  code-point-attributes &amp;= attribute kFennIndex
+    { list { xsd:string { pattern="[0-9][0-9]{0,2}\.[01][0-9]" }+ } }?
+
+  code-point-attributes &amp;= attribute kFourCornerCode
+    { list { xsd:string { pattern="[0-9]{4}(\.[0-9])?" }+ } }?
+
+  code-point-attributes &amp;= attribute kGB0
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGB1
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGB3
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGB5
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGB7
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGB8
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGradeLevel
+    { xsd:string { pattern="[1-6]" } }?
+
+  code-point-attributes &amp;= attribute kGSR
+    { list { xsd:string { pattern="[0-9]{4}[a-vx-z]'?" }+ } }?
+
+  code-point-attributes &amp;= attribute kHangul
+    { list { xsd:string { pattern="[\x{1100}-\x{1112}][\x{1161}-\x{1175}][\x{11A8}-\x{11C2}]?:[01ENX]{1,3}" }+ } }?
+
+  code-point-attributes &amp;= attribute kHanYu
+    { list { xsd:string { pattern="[1-8][0-9]{4}\.[0-3][0-9][0-3]" }+ } }?
+
+  code-point-attributes &amp;= attribute kHanyuPinlu
+    { list { xsd:string { pattern="[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+\([0-9]+\)" }+ } }?
+
+  code-point-attributes &amp;= attribute kHanyuPinyin
+    { list { xsd:string { pattern="(\d{5}\.\d{2}0,)*\d{5}\.\d{2}0:([a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+,)*[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kHDZRadBreak
+    { xsd:string { pattern="[\x{2F00}-\x{2FD5}]\[U\+2F[0-9A-D][0-9A-F]\]:[1-8][0-9]{4}\.[0-3][0-9]0" } }?
+
+  code-point-attributes &amp;= attribute kHKGlyph
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kIBMJapan
+    { list { xsd:string { pattern="F[ABC][0-9A-F]{2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kIICore
+    { list { xsd:string { pattern="[ABC][GHJKMPT]{1,7}" }+ } }?
+
+  code-point-attributes &amp;= attribute kIRG_GSource
+    { "" | xsd:string { pattern="G[013578EKS]-[0-9A-F]{4}" }
+         | xsd:string { pattern="G4K(-\d{5})?" }
+         | xsd:string { pattern="G(DZ|GH|RM|WZ|XC|XH|ZH)-\d{4}\.\d{2}" }
+         | xsd:string { pattern="G(BK|CH|CY|HC)(-\d{4}\.\d{2})?" }
+         | xsd:string { pattern="GKX-\d{4}\.\d{2,3}" }
+         | xsd:string { pattern="G(HZ|HZR)-\d{5}\.\d{2}" }
+         | xsd:string { pattern="G(CE|FC|IDC23|OCD|XHZ)-\d{3}" }
+         | xsd:string { pattern="G(H|HF|LGYJ|PGLG|T)-\d{4}" }
+         | xsd:string { pattern="G(CYY|DM|JZ|KJ|XM|ZFY|ZJW|ZYS)-\d{5}" }
+         | xsd:string { pattern="G(FZ|IDC)-[0-9A-F]{4}" }
+         | xsd:string { pattern="GGFZ-\d{6}" }
+         | xsd:string { pattern="G(LK|Z)-\d{7}" }
+         | xsd:string { pattern="GU-[023][0-9A-F]{4}" }
+         | xsd:string { pattern="GZA-[123467]\d{5}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_HSource
+    { "" | xsd:string { pattern="H-[0-9A-F]{4}" }
+         | xsd:string { pattern="H(B[012])-[0-9A-F]{4}" }
+         | xsd:string { pattern="HD-[23]?[0-9A-F]{4}" }
+         | xsd:string { pattern="HU-[023][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_JSource
+    { "" | xsd:string { pattern="J[014]-[0-9A-F]{4}" }
+         | xsd:string { pattern="J3A?-[0-9A-F]{4}" }
+         | xsd:string { pattern="J13A?-[0-9A-F]{4}" }
+         | xsd:string { pattern="J14-[0-9A-F]{4}" }
+         | xsd:string { pattern="JA[34]?-[0-9A-F]{4}" }
+         | xsd:string { pattern="JARIB-[0-9A-F]{4}" }
+         | xsd:string { pattern="JH-(JT[ABC][0-9A-F]{3}S?|IB\d{4}|\d{6})" }
+         | xsd:string { pattern="JK-\d{5}" }
+         | xsd:string { pattern="JMJ-\d{6}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_KPSource
+    { "" | xsd:string { pattern="KP([01]-[0-9A-F]{4}|U-[023][0-9A-F]{4})" } }?
+
+  code-point-attributes &amp;= attribute kIRG_KSource
+    { "" | xsd:string { pattern="K[0-6]-[0-9A-F]{4}" }
+         | xsd:string { pattern="KC-\d{5}" }
+         | xsd:string { pattern="KU-[023][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_MSource
+    { "" | xsd:string { pattern="MA-[0-9A-F]{4}" }
+         | xsd:string { pattern="MB[12]-[0-9A-F]{4}" }
+         | xsd:string { pattern="MC-\d{5}" }
+         | xsd:string { pattern="MDH?-[23]?[0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_SSource
+    { "" | xsd:string { pattern="SAT-\d{5}" } }?
+
+  code-point-attributes &amp;= attribute kIRG_TSource
+    { "" | xsd:string { pattern="T([1-7A-F]|1[1-3])-[0-9A-F]{4}" }
+         | xsd:string { pattern="TU-[023][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_UKSource
+    { "" | xsd:string { pattern="UK-\d{5}" } }?
+
+  code-point-attributes &amp;= attribute kIRG_USource
+    { "" | xsd:string { pattern="UTC-\d{5}" } }?
+
+  code-point-attributes &amp;= attribute kIRG_VSource
+    { "" | xsd:string { pattern="V[0-4]-[0-9A-F]{4}" }
+         | xsd:string { pattern="VN-[023F][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRGDaeJaweon
+    { list { xsd:string { pattern="[0-9]{4}\.[0-9]{2}[01]" }+ } }?
+
+  code-point-attributes &amp;= attribute kIRGHanyuDaZidian
+    { list { xsd:string { pattern="[1-8][0-9]{4}\.[0-3][0-9][01]" }+ } }?
+
+  code-point-attributes &amp;= attribute kIRGKangXi
+    { list { xsd:string { pattern="[01][0-9]{3}\.[0-7][0-9][01]" }+ } }?
+
+  code-point-attributes &amp;= attribute kJa
+    { list { xsd:string { pattern="[0-9A-F]{4}S?" }+ } }?
+
+  code-point-attributes &amp;= attribute kJapanese
+    { list { xsd:string { pattern="[\x{3041}-\x{3096}\x{3099}\x{309A}\x{30A1}-\x{30FA}\x{30FC}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kJapaneseKun
+    { list { xsd:string { pattern="[A-Z]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kJapaneseOn
+    { list { xsd:string { pattern="[A-Z]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kJinmeiyoKanji
+    { list { xsd:string { pattern="(20[0-9]{2})(:U\+[23]?[0-9A-F]{4})?" }+ } }?
+
+  code-point-attributes &amp;= attribute kJis0
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kJis1
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kJIS0213
+    { list { xsd:string { pattern="[12],[0-9]{2},[0-9]{1,2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kJoyoKanji
+    { list { xsd:string { pattern="(20[0-9]{2})|(U\+[23]?[0-9A-F]{4})" }+ } }?
+
+  code-point-attributes &amp;= attribute kKangXi
+    { list { xsd:string { pattern="[0-9]{4}\.[0-9]{2}[01]" }+ } }?
+
+  code-point-attributes &amp;= attribute kKarlgren
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}[A*]?" }+ } }?
+
+  code-point-attributes &amp;= attribute kKorean
+    { list { xsd:string { pattern="[A-Z]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kKoreanEducationHanja
+    { list { xsd:string { pattern="20[0-9]{2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kKoreanName
+    { list { xsd:string { pattern="20[0-9]{2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kLau
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}" }+ } }?
+
+  code-point-attributes &amp;= attribute kMainlandTelegraph
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kMandarin
+    { list { xsd:string { pattern="[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kMatthews
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}(a|\.5)?" }+ } }?
+
+  code-point-attributes &amp;= attribute kMeyerWempe
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}[a-t*]?" }+ } }?
+
+  code-point-attributes &amp;= attribute kMojiJoho
+    { list { xsd:string { pattern="MJ\d{6}(:(FE0[01]|E01[01][0-9A-F]))?" }+ } }?
+
+  code-point-attributes &amp;= attribute kMorohashi
+    { list { xsd:string { pattern="(\d{5}'{0,2}|H\d{3})(:(FE0[01]|E010[0-9A-F]))?" }+ } }?
+
+  code-point-attributes &amp;= attribute kNelson
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kOtherNumeric
+    { list { xsd:string { pattern="[0-9]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kPhonetic
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}[A-D]?\*?" }+ } }?
+
+  code-point-attributes &amp;= attribute kPrimaryNumeric
+    { list { xsd:string { pattern="[0-9]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kPseudoGB1
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kRSAdobe_Japan1_6
+    { list { xsd:string { pattern="[CV]\+[0-9]{1,5}\+[1-9][0-9]{0,2}\.[1-9][0-9]?\.[0-9]{1,2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kRSUnicode
+    { list { xsd:string { pattern="[1-9][0-9]{0,2}'{0,3}\.-?[0-9]{1,2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kSBGY
+    { list { xsd:string { pattern="[0-9]{3}\.[0-7][0-9]" }+ } }?
+
+  code-point-attributes &amp;= attribute kSemanticVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}(&lt;[ks][A-Za-z0-9_]+(:[TBZFJ]+)?(,[ks][A-Za-z0-9_]+(:[TBZFJ]+)?)*)?" }+ } }?
+
+  code-point-attributes &amp;= attribute kSimplifiedVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kSMSZD2003Index
+    { list { xsd:string { pattern="\d{1,3}\.\d{2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kSMSZD2003Readings
+    { list { xsd:string { pattern="[a-z\x{300}\x{301}\x{302}\x{304}\x{308}\x{30C}]+(,[a-z\x{300}\x{301}\x{302}\x{304}\x{308}\x{30C}]+)*\x{7CB5}[a-z]+[1-6]([a-z]+[1-6])?(,[a-z]+[1-6]([a-z]+[1-6])?)*" }+ } }?
+
+  code-point-attributes &amp;= attribute kSpecializedSemanticVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}(&lt;[ks][A-Za-z0-9_]+(:[TBZFJ]+)?(,[ks][A-Za-z0-9_]+(:[TBZFJ]+)?)*)?" }+ } }?
+
+  code-point-attributes &amp;= attribute kSpoofingVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kStrange
+    { list { ( xsd:string { pattern="[ACU]" }
+             | xsd:string { pattern="B:U\+31[0-2AB][0-9A-F]" }
+             | xsd:string { pattern="[FMOR](:U\+[23]?[0-9A-F]{4})?" }
+             | xsd:string { pattern="H:U\+31[3-8][0-9A-F]" }
+             | xsd:string { pattern="I(:U\+[23]?[0-9A-F]{4})*" }
+             | xsd:string { pattern="K(:U\+30[A-F][0-9A-F])+" }
+             | xsd:string { pattern="S:[4-9][0-9]" }
+    )+}}?
+
+  code-point-attributes &amp;= attribute kTaiwanTelegraph
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kTang
+    { list { xsd:string { pattern="\*?[A-Za-z()\x{E6}\x{251}\x{259}\x{25B}\x{300}\x{30C}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kTGH
+    { list { xsd:string { pattern="20[0-9]{2}:[1-9][0-9]{0,3}" }+ } }?
+
+  code-point-attributes &amp;= attribute kTGHZ2013
+    { list { xsd:string { pattern="[0-9]{3}\.[0-9]{3}(,[0-9]{3}\.[0-9]{3})*:[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kTotalStrokes
+    { list { xsd:string { pattern="[1-9][0-9]{0,2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kTraditionalVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kUnihanCore2020
+    { xsd:string { pattern="[GHJKMPT]{1,7}" } }?
+
+  code-point-attributes &amp;= attribute kVietnamese
+    { list { xsd:string { pattern="[A-Za-z\x{110}\x{111}\x{300}-\x{303}\x{306}\x{309}\x{31B}\x{323}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kVietnameseNumeric
+    { list { xsd:string { pattern="\d+" }+ } }?
+
+  code-point-attributes &amp;= attribute kXerox
+    { list { xsd:string { pattern="[0-9]{3}:[0-9]{3}" }+ } }?
+
+  code-point-attributes &amp;= attribute kXHC1983
+    { list { xsd:string { pattern="[0-9]{4}\.[0-9]{3}\*?(,[0-9]{4}\.[0-9]{3}\*?)*:[a-z\x{300}\x{301}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kZhuang
+    { list { xsd:string { pattern="[a-z]+\*?" }+ } }?
+
+  code-point-attributes &amp;= attribute kZhuangNumeric
+    { list { xsd:string { pattern="\d+" }+ } }?
+
+  code-point-attributes &amp;= attribute kZVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}(&lt;[ks][A-Za-z0-9_]+(:[TBZ]+)?(,[ks][A-Za-z0-9_]+(:[TBZ]+)?)*)?" }+ } }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/age.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/age.xml
new file mode 100644
index 000000000..8a1722f22
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/age.xml
@@ -0,0 +1,23 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="age attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute age { "1.1"
+                  | "2.0" | "2.1"
+                  | "3.0" | "3.1" | "3.2"
+                  | "4.0" | "4.1"
+                  | "5.0" | "5.1" | "5.2"
+                  | "6.0" | "6.1" | "6.2" | "6.3"
+                  | "7.0"
+                  | "8.0"
+                  | "9.0"
+                  | "10.0"
+                  | "11.0"
+                  | "12.0" | "12.1"
+                  | "13.0"
+                  | "14.0"
+                  | "15.0" | "15.1"
+                  | "16.0"
+                  | "17.0"
+                  | "unassigned"
+                  }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/bc.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/bc.xml
new file mode 100644
index 000000000..d3e70a6ab
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/bc.xml
@@ -0,0 +1,17 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="bc attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute bc { "AL" | "AN"
+                 | "B" | "BN"
+                 | "CS"
+                 | "EN" | "ES" | "ET"
+                 | "FSI"
+                 | "L" | "LRE" | "LRI" | "LRO"
+                 | "NSM"
+                 | "ON"
+                 | "PDF" | "PDI"
+                 | "R" | "RLE" | "RLI" | "RLO"
+                 | "S"
+                 | "WS"
+                 }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/blk.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/blk.xml
new file mode 100644
index 000000000..ecd721a63
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/blk.xml
@@ -0,0 +1,344 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="blk attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute blk { "Adlam"
+                  | "Aegean_Numbers"
+                  | "Ahom"
+                  | "Alchemical"
+                  | "Alphabetic_PF"
+                  | "Anatolian_Hieroglyphs"
+                  | "Ancient_Greek_Music"
+                  | "Ancient_Greek_Numbers"
+                  | "Ancient_Symbols"
+                  | "Arabic"
+                  | "Arabic_Ext_A"
+                  | "Arabic_Ext_B"
+                  | "Arabic_Ext_C"
+                  | "Arabic_Math"
+                  | "Arabic_PF_A"
+                  | "Arabic_PF_B"
+                  | "Arabic_Sup"
+                  | "Armenian"
+                  | "Arrows"
+                  | "ASCII"
+                  | "Avestan"
+                  | "Balinese"
+                  | "Bamum"
+                  | "Bamum_Sup"
+                  | "Bassa_Vah"
+                  | "Batak"
+                  | "Bengali"
+                  | "Bhaiksuki"
+                  | "Block_Elements"
+                  | "Bopomofo"
+                  | "Bopomofo_Ext"
+                  | "Box_Drawing"
+                  | "Brahmi"
+                  | "Braille"
+                  | "Buginese"
+                  | "Buhid"
+                  | "Byzantine_Music"
+                  | "Carian"
+                  | "Caucasian_Albanian"
+                  | "Chakma"
+                  | "Cham"
+                  | "Cherokee"
+                  | "Cherokee_Sup"
+                  | "Chess_Symbols"
+                  | "Chorasmian"
+                  | "CJK"
+                  | "CJK_Compat"
+                  | "CJK_Compat_Forms"
+                  | "CJK_Compat_Ideographs"
+                  | "CJK_Compat_Ideographs_Sup"
+                  | "CJK_Ext_A"
+                  | "CJK_Ext_B"
+                  | "CJK_Ext_C"
+                  | "CJK_Ext_D"
+                  | "CJK_Ext_E"
+                  | "CJK_Ext_F"
+                  | "CJK_Ext_G"
+                  | "CJK_Ext_H"
+                  | "CJK_Ext_I"
+                  | "CJK_Radicals_Sup"
+                  | "CJK_Strokes"
+                  | "CJK_Symbols"
+                  | "Compat_Jamo"
+                  | "Control_Pictures"
+                  | "Coptic"
+                  | "Coptic_Epact_Numbers"
+                  | "Counting_Rod"
+                  | "Cuneiform"
+                  | "Cuneiform_Numbers"
+                  | "Currency_Symbols"
+                  | "Cypriot_Syllabary"
+                  | "Cypro_Minoan"
+                  | "Cyrillic"
+                  | "Cyrillic_Ext_A"
+                  | "Cyrillic_Ext_B"
+                  | "Cyrillic_Ext_C"
+                  | "Cyrillic_Ext_D"
+                  | "Cyrillic_Sup"
+                  | "Deseret"
+                  | "Devanagari"
+                  | "Devanagari_Ext"
+                  | "Devanagari_Ext_A"
+                  | "Diacriticals"
+                  | "Diacriticals_Ext"
+                  | "Diacriticals_For_Symbols"
+                  | "Diacriticals_Sup"
+                  | "Dingbats"
+                  | "Dives_Akuru"
+                  | "Dogra"
+                  | "Domino"
+                  | "Duployan"
+                  | "Early_Dynastic_Cuneiform"
+                  | "Egyptian_Hieroglyph_Format_Controls"
+                  | "Egyptian_Hieroglyphs"
+                  | "Egyptian_Hieroglyphs_Ext_A"
+                  | "Elbasan"
+                  | "Elymaic"
+                  | "Emoticons"
+                  | "Enclosed_Alphanum"
+                  | "Enclosed_Alphanum_Sup"
+                  | "Enclosed_CJK"
+                  | "Enclosed_Ideographic_Sup"
+                  | "Ethiopic"
+                  | "Ethiopic_Ext"
+                  | "Ethiopic_Ext_A"
+                  | "Ethiopic_Ext_B"
+                  | "Ethiopic_Sup"
+                  | "Garay"
+                  | "Geometric_Shapes"
+                  | "Geometric_Shapes_Ext"
+                  | "Georgian"
+                  | "Georgian_Ext"
+                  | "Georgian_Sup"
+                  | "Glagolitic"
+                  | "Glagolitic_Sup"
+                  | "Gothic"
+                  | "Grantha"
+                  | "Greek"
+                  | "Greek_Ext"
+                  | "Gujarati"
+                  | "Gunjala_Gondi"
+                  | "Gurmukhi"
+                  | "Gurung_Khema"
+                  | "Half_And_Full_Forms"
+                  | "Half_Marks"
+                  | "Hangul"
+                  | "Hanifi_Rohingya"
+                  | "Hanunoo"
+                  | "Hatran"
+                  | "Hebrew"
+                  | "High_PU_Surrogates"
+                  | "High_Surrogates"
+                  | "Hiragana"
+                  | "IDC"
+                  | "Ideographic_Symbols"
+                  | "Imperial_Aramaic"
+                  | "Indic_Number_Forms"
+                  | "Indic_Siyaq_Numbers"
+                  | "Inscriptional_Pahlavi"
+                  | "Inscriptional_Parthian"
+                  | "IPA_Ext"
+                  | "Jamo"
+                  | "Jamo_Ext_A"
+                  | "Jamo_Ext_B"
+                  | "Javanese"
+                  | "Kaithi"
+                  | "Kaktovik_Numerals"
+                  | "Kana_Ext_A"
+                  | "Kana_Ext_B"
+                  | "Kana_Sup"
+                  | "Kanbun"
+                  | "Kangxi"
+                  | "Kannada"
+                  | "Katakana"
+                  | "Katakana_Ext"
+                  | "Kawi"
+                  | "Kayah_Li"
+                  | "Kharoshthi"
+                  | "Khitan_Small_Script"
+                  | "Khmer"
+                  | "Khmer_Symbols"
+                  | "Khojki"
+                  | "Khudawadi"
+                  | "Kirat_Rai"
+                  | "Lao"
+                  | "Latin_1_Sup"
+                  | "Latin_Ext_A"
+                  | "Latin_Ext_Additional"
+                  | "Latin_Ext_B"
+                  | "Latin_Ext_C"
+                  | "Latin_Ext_D"
+                  | "Latin_Ext_E"
+                  | "Latin_Ext_F"
+                  | "Latin_Ext_G"
+                  | "Lepcha"
+                  | "Letterlike_Symbols"
+                  | "Limbu"
+                  | "Linear_A"
+                  | "Linear_B_Ideograms"
+                  | "Linear_B_Syllabary"
+                  | "Lisu"
+                  | "Lisu_Sup"
+                  | "Low_Surrogates"
+                  | "Lycian"
+                  | "Lydian"
+                  | "Mahajani"
+                  | "Mahjong"
+                  | "Makasar"
+                  | "Malayalam"
+                  | "Mandaic"
+                  | "Manichaean"
+                  | "Marchen"
+                  | "Masaram_Gondi"
+                  | "Math_Alphanum"
+                  | "Math_Operators"
+                  | "Mayan_Numerals"
+                  | "Medefaidrin"
+                  | "Meetei_Mayek"
+                  | "Meetei_Mayek_Ext"
+                  | "Mende_Kikakui"
+                  | "Meroitic_Cursive"
+                  | "Meroitic_Hieroglyphs"
+                  | "Miao"
+                  | "Misc_Arrows"
+                  | "Misc_Math_Symbols_A"
+                  | "Misc_Math_Symbols_B"
+                  | "Misc_Pictographs"
+                  | "Misc_Symbols"
+                  | "Misc_Technical"
+                  | "Modi"
+                  | "Modifier_Letters"
+                  | "Modifier_Tone_Letters"
+                  | "Mongolian"
+                  | "Mongolian_Sup"
+                  | "Mro"
+                  | "Multani"
+                  | "Music"
+                  | "Myanmar"
+                  | "Myanmar_Ext_A"
+                  | "Myanmar_Ext_B"
+                  | "Myanmar_Ext_C"
+                  | "Nabataean"
+                  | "Nag_Mundari"
+                  | "Nandinagari"
+                  | "NB"
+                  | "New_Tai_Lue"
+                  | "Newa"
+                  | "NKo"
+                  | "Number_Forms"
+                  | "Nushu"
+                  | "Nyiakeng_Puachue_Hmong"
+                  | "OCR"
+                  | "Ogham"
+                  | "Ol_Chiki"
+                  | "Ol_Onal"
+                  | "Old_Hungarian"
+                  | "Old_Italic"
+                  | "Old_North_Arabian"
+                  | "Old_Permic"
+                  | "Old_Persian"
+                  | "Old_Sogdian"
+                  | "Old_South_Arabian"
+                  | "Old_Turkic"
+                  | "Old_Uyghur"
+                  | "Oriya"
+                  | "Ornamental_Dingbats"
+                  | "Osage"
+                  | "Osmanya"
+                  | "Ottoman_Siyaq_Numbers"
+                  | "Pahawh_Hmong"
+                  | "Palmyrene"
+                  | "Pau_Cin_Hau"
+                  | "Phags_Pa"
+                  | "Phaistos"
+                  | "Phoenician"
+                  | "Phonetic_Ext"
+                  | "Phonetic_Ext_Sup"
+                  | "Playing_Cards"
+                  | "Psalter_Pahlavi"
+                  | "PUA"
+                  | "Punctuation"
+                  | "Rejang"
+                  | "Rumi"
+                  | "Runic"
+                  | "Samaritan"
+                  | "Saurashtra"
+                  | "Sharada"
+                  | "Shavian"
+                  | "Shorthand_Format_Controls"
+                  | "Siddham"
+                  | "Sinhala"
+                  | "Sinhala_Archaic_Numbers"
+                  | "Small_Forms"
+                  | "Small_Kana_Ext"
+                  | "Sogdian"
+                  | "Sora_Sompeng"
+                  | "Soyombo"
+                  | "Specials"
+                  | "Sundanese"
+                  | "Sundanese_Sup"
+                  | "Sunuwar"
+                  | "Sup_Arrows_A"
+                  | "Sup_Arrows_B"
+                  | "Sup_Arrows_C"
+                  | "Sup_Math_Operators"
+                  | "Sup_PUA_A"
+                  | "Sup_PUA_B"
+                  | "Sup_Punctuation"
+                  | "Sup_Symbols_And_Pictographs"
+                  | "Super_And_Sub"
+                  | "Sutton_SignWriting"
+                  | "Syloti_Nagri"
+                  | "Symbols_And_Pictographs_Ext_A"
+                  | "Symbols_For_Legacy_Computing"
+                  | "Symbols_For_Legacy_Computing_Sup"
+                  | "Syriac"
+                  | "Syriac_Sup"
+                  | "Tagalog"
+                  | "Tagbanwa"
+                  | "Tags"
+                  | "Tai_Le"
+                  | "Tai_Tham"
+                  | "Tai_Viet"
+                  | "Tai_Xuan_Jing"
+                  | "Takri"
+                  | "Tamil"
+                  | "Tamil_Sup"
+                  | "Tangsa"
+                  | "Tangut"
+                  | "Tangut_Components"
+                  | "Tangut_Sup"
+                  | "Telugu"
+                  | "Thaana"
+                  | "Thai"
+                  | "Tibetan"
+                  | "Tifinagh"
+                  | "Tirhuta"
+                  | "Todhri"
+                  | "Toto"
+                  | "Transport_And_Map"
+                  | "Tulu_Tigalari"
+                  | "UCAS"
+                  | "UCAS_Ext"
+                  | "UCAS_Ext_A"
+                  | "Ugaritic"
+                  | "Vai"
+                  | "Vedic_Ext"
+                  | "Vertical_Forms"
+                  | "Vithkuqi"
+                  | "VS"
+                  | "VS_Sup"
+                  | "Wancho"
+                  | "Warang_Citi"
+                  | "Yezidi"
+                  | "Yi_Radicals"
+                  | "Yi_Syllables"
+                  | "Yijing"
+                  | "Zanabazar_Square"
+                  | "Znamenny_Music"
+                  }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/block.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/block.xml
new file mode 100644
index 000000000..1d9b2beb8
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/block.xml
@@ -0,0 +1,10 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="blocks" id='schema.block'>
+  ucd.content &amp;=
+    element blocks {
+      element block {
+        attribute first-cp { single-code-point },
+        attribute last-cp { single-code-point },
+        attribute name { text } }+ }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/bmg.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/bmg.xml
new file mode 100644
index 000000000..d4431070d
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/bmg.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="bmg attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute bmg { "" | single-code-point }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/boolean.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/boolean.xml
new file mode 100644
index 000000000..fae36d68d
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/boolean.xml
@@ -0,0 +1,4 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="boolean" id='schema.boolean'>
+  boolean = "Y" | "N"
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/boundaries.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/boundaries.xml
new file mode 100644
index 000000000..abe4ffe9a
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/boundaries.xml
@@ -0,0 +1,58 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="properties related to boundaries" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute Gr_Base { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Gr_Ext { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OGr_Ext { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Gr_Link { boolean }?
+
+  code-point-attributes &amp;=
+    attribute GCB { "CN" | "CR"
+                  | "EB" | "EBG" | "EM" | "EX"
+                  | "GAZ"
+                  | "L" | "LF" | "LV" | "LVT"
+                  | "PP"
+                  | "RI"
+                  | "SM"
+                  | "T"
+                  | "V"
+                  | "XX"
+                  | "ZWJ"
+                  }?
+
+  code-point-attributes &amp;=
+    attribute WB { "CR"
+                 | "DQ"
+                 | "EB" | "EBG" | "EM" | "EX" | "Extend"
+                 | "FO"
+                 | "GAZ"
+                 | "HL"
+                 | "KA"
+                 | "LE" | "LF"
+                 | "MB" | "ML" | "MN"
+                 | "NL" | "NU"
+                 | "RI"
+                 | "SQ"
+                 | "WSegSpace"
+                 | "XX"
+                 | "ZWJ"
+                 }?
+
+  code-point-attributes &amp;=
+    attribute SB { "AT"
+                 | "CL" | "CR"
+                 | "EX"
+                 | "FO"
+                 | "LE" | "LF" | "LO"
+                 | "NU"
+                 | "SC" | "SE" | "SP" | "ST"
+                 | "UP"
+                 | "XX"
+                 }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/bpb.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/bpb.xml
new file mode 100644
index 000000000..3924ed3e9
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/bpb.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="bpb attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute bpb { "#" | single-code-point }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/bpt.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/bpt.xml
new file mode 100644
index 000000000..183c9bf3f
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/bpt.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="bpt attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute bpt { "o" | "c" | "n" }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/case_folding.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/case_folding.xml
new file mode 100644
index 000000000..8708699be
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/case_folding.xml
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="casing properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute scf { "#" | single-code-point }?
+
+  code-point-attributes &amp;=
+    attribute cf { "#" | one-or-more-code-points }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/case_mapping.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/case_mapping.xml
new file mode 100644
index 000000000..c1296b7b9
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/case_mapping.xml
@@ -0,0 +1,11 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="casing properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute uc { "#" | one-or-more-code-points }?
+
+  code-point-attributes &amp;=
+    attribute lc { "#" | one-or-more-code-points }?
+
+  code-point-attributes &amp;=
+    attribute tc { "#" | one-or-more-code-points }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/case_other.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/case_other.xml
new file mode 100644
index 000000000..df4b97e64
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/case_other.xml
@@ -0,0 +1,32 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="casing properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute CI { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Cased { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWCF { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWCM { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWL { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWKCF { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWT { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWU { boolean }?
+
+  code-point-attributes &amp;=
+    attribute NFKC_CF { "#" | zero-or-more-code-points }?
+
+  code-point-attributes &amp;=
+    attribute NFKC_SCF { "#" | zero-or-more-code-points }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/casing.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/casing.xml
new file mode 100644
index 000000000..503f05999
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/casing.xml
@@ -0,0 +1,14 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="casing properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute Upper { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Lower { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OUpper { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OLower { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/ccc.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/ccc.xml
new file mode 100644
index 000000000..8226509d7
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/ccc.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="ccc attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute ccc { xsd:integer { minInclusive="0" maxInclusive="254" } }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/cjk-radicals.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/cjk-radicals.xml
new file mode 100644
index 000000000..45c49ed2c
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/cjk-radicals.xml
@@ -0,0 +1,10 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="cjk radicals" id='schema.cjk-radicals'>
+  ucd.content &amp;=
+    element cjk-radicals {
+      element cjk-radical {
+        attribute number { xsd:string {pattern="[0-9]{1,3}'{0,3}"}},
+        attribute radical { single-code-point? },
+        attribute ideograph { single-code-point } }+ }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/cjkEACC.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/cjkEACC.xml
new file mode 100644
index 000000000..08222c4f0
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/cjkEACC.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="cjkEACC attribute" id='schema.properties'>
+  code-point-attributes &amp;= attribute cjkEACC
+ { xsd:string { pattern="[0-9A-F]{6}" } }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/cjkIRG_TSource.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/cjkIRG_TSource.xml
new file mode 100644
index 000000000..49f9c3917
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/cjkIRG_TSource.xml
@@ -0,0 +1,6 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="cjkIRG_TSource attribute" id='schema.properties'>
+  code-point-attributes &amp;= attribute cjkIRG_TSource
+ { xsd:string { pattern="T([1-7A-F]|1[1-3])-[0-9A-F]{4}|TU-[023][0-9A-F]{4}" }
+ }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/composition.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/composition.xml
new file mode 100644
index 000000000..96ce4abcf
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/composition.xml
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="composition properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute CE { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Comp_Ex { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/datatypes.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/datatypes.xml
new file mode 100644
index 000000000..c26367d97
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/datatypes.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="datatypes declaration" id='schema.datatypes'>
+  # default; datatypes xsd = "http://www.w3.org/2001/XMLSchema-datatypes"
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/datatypes_code_points.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/datatypes_code_points.xml
new file mode 100644
index 000000000..c3cda88df
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/datatypes_code_points.xml
@@ -0,0 +1,9 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="datatype for code points" id='schema.datatypes'>
+  single-code-point = xsd:string { pattern = "(|[1-9A-F]|(10))[0-9A-F]{4}" }
+
+  one-or-more-code-points = list { single-code-point + }
+  zero-or-more-code-points = list { single-code-point * }
+  two-code-points = list { single-code-point, single-code-point }
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/decomposition.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/decomposition.xml
new file mode 100644
index 000000000..833a7d1e0
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/decomposition.xml
@@ -0,0 +1,11 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="decomposition properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute dt { "can" | "com" | "enc" | "fin" | "font" | "fra"
+                 | "init" | "iso" | "med" | "nar" | "nb" | "sml"
+                 | "sqr" | "sub" | "sup" | "vert" | "wide" | "none"
+                 }?
+
+  code-point-attributes &amp;=
+    attribute dm { "#" | zero-or-more-code-points }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/description.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/description.xml
new file mode 100644
index 000000000..97bb063e7
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/description.xml
@@ -0,0 +1,6 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="description" id='schema.description'>
+  ucd.content &amp;=
+    element description { text }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/do-not-emit.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/do-not-emit.xml
new file mode 100644
index 000000000..5381491e7
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/do-not-emit.xml
@@ -0,0 +1,22 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="do-not-emit" id='schema.do-not-emit'>
+  ucd.content &amp;=
+    element do-not-emit {
+      element instead {
+        attribute of { one-or-more-code-points },
+        attribute use { one-or-more-code-points },
+        attribute because { "Bengali_Khanda_Ta"
+                          | "Deprecated"
+                          | "Discouraged"
+                          | "Dotless_Form"
+                          | "Hamza_Form"
+                          | "Indic_Atomic_Consonant"
+                          | "Indic_Consonant_Conjunct"
+                          | "Indic_Vowel_Letter"
+                          | "Malayalam_Chillu"
+                          | "Precomposed_Form"
+                          | "Precomposed_Hieroglyph"
+                          | "Preferred_Spelling"
+                          | "Tamil_Shrii"
+      } }+ }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/ea.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/ea.xml
new file mode 100644
index 000000000..d51bf2441
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/ea.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="ea attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute ea { "A" | "F" | "H" | "N" | "Na" | "W" }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/emoji-sources.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/emoji-sources.xml
new file mode 100644
index 000000000..96d122953
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/emoji-sources.xml
@@ -0,0 +1,11 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="emoji sources" id='schema.emoji-sources'>
+  ucd.content &amp;=
+    element emoji-sources {
+      element emoji-source {
+        attribute unicode { one-or-more-code-points },
+        attribute docomo { jis-code-point? },
+        attribute kddi { jis-code-point? },
+        attribute softbank { jis-code-point? } }+ }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/function_graphic.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/function_graphic.xml
new file mode 100644
index 000000000..7ce510adc
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/function_graphic.xml
@@ -0,0 +1,68 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="properties related to function and graphic characteristics" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute Dash { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Hyphen { boolean }?
+
+  code-point-attributes &amp;=
+    attribute QMark { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Term { boolean }?
+
+  code-point-attributes &amp;=
+    attribute STerm { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Dia { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Ext { boolean }?
+
+  code-point-attributes &amp;=
+    attribute SD { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Alpha { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OAlpha { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Math { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OMath { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Hex { boolean }?
+
+  code-point-attributes &amp;=
+    attribute AHex { boolean }?
+
+  code-point-attributes &amp;=
+    attribute DI { boolean }?
+
+  code-point-attributes &amp;=
+    attribute ODI { boolean }?
+
+  code-point-attributes &amp;=
+    attribute LOE { boolean }?
+
+  code-point-attributes &amp;=
+    attribute PCM { boolean }?
+
+  code-point-attributes &amp;=
+    attribute MCM { boolean }?
+
+  code-point-attributes &amp;=
+    attribute WSpace { boolean }?
+
+  code-point-attributes &amp;=
+    attribute vo { "R" | "Tr" | "Tu" | "U" }?
+
+  code-point-attributes &amp;=
+    attribute RI { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/gc.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/gc.xml
new file mode 100644
index 000000000..36cd1f774
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/gc.xml
@@ -0,0 +1,12 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="gc attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute gc { "Cc" | "Cf" | "Cn" | "Co" | "Cs"
+                 | "Ll" | "Lm" | "Lo" | "Lt" | "Lu"
+                 | "Mc" | "Me" | "Mn"
+                 | "Nd" | "Nl" | "No"
+                 | "Pc" | "Pd" | "Pe" | "Pf" | "Pi" | "Po" | "Ps"
+                 | "Sc" | "Sk" | "Sm" | "So"
+                 | "Zl" | "Zp" | "Zs"
+                 }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/groups.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/groups.xml
new file mode 100644
index 000000000..11f3b0dd9
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/groups.xml
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="groups" id='schema.repertoire'>
+  group =
+    element group {
+      code-point-attributes,
+      code-point* }
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/hst.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/hst.xml
new file mode 100644
index 000000000..385cd466a
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/hst.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="hst attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute hst { "L" | "LV" | "LVT" | "NA" | "T" | "V" }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/identifier.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/identifier.xml
new file mode 100644
index 000000000..0ab95a27f
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/identifier.xml
@@ -0,0 +1,26 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="identifier properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute IDS { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OIDS { boolean }?
+
+  code-point-attributes &amp;=
+    attribute XIDS { boolean }?
+
+  code-point-attributes &amp;=
+    attribute IDC { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OIDC { boolean }?
+
+  code-point-attributes &amp;=
+    attribute XIDC { boolean }?
+
+  code-point-attributes &amp;=
+    attribute ID_Compat_Math_Start { boolean }?
+
+  code-point-attributes &amp;=
+    attribute ID_Compat_Math_Continue { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/ideographs.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/ideographs.xml
new file mode 100644
index 000000000..0c758e342
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/ideographs.xml
@@ -0,0 +1,23 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="properties related to ideographs" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute Ideo { boolean }?
+
+  code-point-attributes &amp;=
+    attribute UIdeo { boolean }?
+
+  code-point-attributes &amp;=
+    attribute EqUIdeo { single-code-point }?
+
+  code-point-attributes &amp;=
+    attribute IDSB { boolean }?
+
+  code-point-attributes &amp;=
+    attribute IDST { boolean }?
+
+  code-point-attributes &amp;=
+    attribute IDSU { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Radical { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/isc.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/isc.xml
new file mode 100644
index 000000000..f19b59317
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/isc.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="isc attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute isc { text }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/jis-code-point.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/jis-code-point.xml
new file mode 100644
index 000000000..9a6820c7b
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/jis-code-point.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="datatype for code points" id='schema.datatypes'>
+  jis-code-point = xsd:string { pattern = "[0-9A-F]{4}" }
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/joining.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/joining.xml
new file mode 100644
index 000000000..184fcca14
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/joining.xml
@@ -0,0 +1,53 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="joining properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute jt { "C" | "D" | "L" | "R" | "T" | "U" }?
+
+  code-point-attributes &amp;=
+    attribute jg { "African_Feh" | "African_Noon" | "African_Qaf"
+                 | "Ain" | "Alaph" | "Alef"
+                 | "Beh" | "Beth" | "Burushaski_Yeh_Barree"
+                 | "Dal" | "Dalath_Rish"
+                 | "E"
+                 | "Farsi_Yeh" | "Fe" | "Feh" | "Final_Semkath"
+                 | "Gaf" | "Gamal"
+                 | "Hah" | "Hanifi_Rohingya_Kinna_Ya"
+                 | "Hanifi_Rohingya_Pa" | "He" | "Heh" | "Heh_Goal"
+                 | "Heth"
+                 | "Kaf" | "Kaph" | "Kashmiri_Yeh" | "Khaph"
+                 | "Knotted_Heh"
+                 | "Lam" | "Lamadh"
+                 | "Malayalam_Bha" | "Malayalam_Ja" | "Malayalam_Lla"
+                 | "Malayalam_Llla" | "Malayalam_Nga"
+                 | "Malayalam_Nna" | "Malayalam_Nnna"
+                 | "Malayalam_Nya" | "Malayalam_Ra" | "Malayalam_Ssa"
+                 | "Malayalam_Tta" | "Manichaean_Aleph"
+                 | "Manichaean_Ayin" | "Manichaean_Beth"
+                 | "Manichaean_Daleth" | "Manichaean_Dhamedh"
+                 | "Manichaean_Five" | "Manichaean_Gimel"
+                 | "Manichaean_Heth" | "Manichaean_Hundred"
+                 | "Manichaean_Kaph" | "Manichaean_Lamedh"
+                 | "Manichaean_Mem" | "Manichaean_Nun"
+                 | "Manichaean_One" | "Manichaean_Pe"
+                 | "Manichaean_Qoph" | "Manichaean_Resh"
+                 | "Manichaean_Sadhe" | "Manichaean_Samekh"
+                 | "Manichaean_Taw" | "Manichaean_Ten"
+                 | "Manichaean_Teth" | "Manichaean_Thamedh"
+                 | "Manichaean_Twenty" | "Manichaean_Waw"
+                 | "Manichaean_Yodh" | "Manichaean_Zayin" | "Meem"
+                 | "Mim"
+                 | "No_Joining_Group" | "Noon" | "Nun" | "Nya"
+                 | "Pe"
+                 | "Qaf" | "Qaph"
+                 | "Reh" | "Reversed_Pe" | "Rohingya_Yeh"
+                 | "Sad" | "Sadhe" | "Seen" | "Semkath" | "Shin"
+                 | "Straight_Waw" | "Swash_Kaf" | "Syriac_Waw"
+                 | "Tah" | "Taw" | "Teh_Marbuta" | "Teh_Marbuta_Goal"
+                 | "Teth" | "Thin_Yeh"
+                 | "Vertical_Tail"
+                 | "Waw"
+                 | "Yeh" | "Yeh_Barree" | "Yeh_With_Tail" | "Yudh"
+                 | "Yudh_He"
+                 | "Zain" | "Zhain"
+                 }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/lb.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/lb.xml
new file mode 100644
index 000000000..ee1f36cac
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/lb.xml
@@ -0,0 +1,24 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="lb attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute lb { "AI" | "AK" | "AL" | "AP" | "AS"
+                 | "B2" | "BA" | "BB" | "BK"
+                 | "CB" | "CJ" | "CL" | "CM" | "CP" | "CR"
+                 | "EB" | "EM" | "EX"
+                 | "GL"
+                 | "H2" | "H3" | "HL" | "HY"
+                 | "ID" | "IN" | "IS"
+                 | "JL" | "JT" | "JV"
+                 | "LF"
+                 | "NL" | "NS" | "NU"
+                 | "OP"
+                 | "PO" | "PR"
+                 | "QU"
+                 | "RI"
+                 | "SA" | "SG" | "SP" | "SY"
+                 | "VF" | "VI"
+                 | "WJ"
+                 | "XX"
+                 | "ZW" | "ZWJ"
+                 }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/miscellaneous.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/miscellaneous.xml
new file mode 100644
index 000000000..5dafe8c22
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/miscellaneous.xml
@@ -0,0 +1,11 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="miscellaneous properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute Dep { boolean }?
+
+  code-point-attributes &amp;=
+    attribute VS { boolean }?
+
+  code-point-attributes &amp;=
+    attribute NChar { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/na.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/na.xml
new file mode 100644
index 000000000..4c4644c31
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/na.xml
@@ -0,0 +1,13 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="na attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute na { "" |
+                   "CJK UNIFIED IDEOGRAPH-#" |
+                   "CJK COMPATIBILITY IDEOGRAPH-#" |
+                   "EGYPTIAN HIEROGLYPH-#" |
+                   "TANGUT IDEOGRAPH-#" |
+                   "KHITAN SMALL SCRIPT CHARACTER-#" |
+                   "NUSHU CHARACTER-#" |
+                   xsd:string { pattern="[a-zA-Z0-9]+(( -|- |[\-_ ])[a-zA-Z0-9]+)*" }
+                 }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/na1.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/na1.xml
new file mode 100644
index 000000000..592de98c3
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/na1.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="na1 attribute" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute na1 { "" | xsd:string { pattern="[a-zA-Z0-9]+([\-_ ][a-zA-Z0-9]+)*( \(.*\))?" } }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/named-sequences.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/named-sequences.xml
new file mode 100644
index 000000000..2859ea29d
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/named-sequences.xml
@@ -0,0 +1,15 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="named sequences" id='schema.named-sequences'>
+  ucd.content &amp;=
+    element named-sequences {
+      element named-sequence {
+        attribute cps { one-or-more-code-points },
+        attribute name { text } }+ }?
+
+  ucd.content &amp;=
+    element provisional-named-sequences {
+      element named-sequence {
+        attribute cps { one-or-more-code-points },
+        attribute name { text } }+ }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/namespace.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/namespace.xml
new file mode 100644
index 000000000..e75306a26
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/namespace.xml
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="namespace declaration" id='schema.namespace'>
+  default namespace ucd = "http://www.unicode.org/ns/2003/ucd/1.0"
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/normalization-corrections.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/normalization-corrections.xml
new file mode 100644
index 000000000..7231a8c26
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/normalization-corrections.xml
@@ -0,0 +1,11 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="normalization corrections" id='schema.normalization-corrections'>
+  ucd.content &amp;=
+    element normalization-corrections {
+      element normalization-correction {
+        attribute cp { single-code-point },
+        attribute old { one-or-more-code-points },
+        attribute new { one-or-more-code-points },
+        attribute version { text } }+ }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/numeric.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/numeric.xml
new file mode 100644
index 000000000..24230aee1
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/numeric.xml
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="numeric properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute nt { "De" | "Di" | "Nu" | "None" }?
+
+  code-point-attributes &amp;=
+    attribute nv { "NaN" | xsd:string { pattern="-?[0-9]+(/[0-9]+)?" } }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/pattern.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/pattern.xml
new file mode 100644
index 000000000..baa00a73c
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/pattern.xml
@@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="pattern properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute Pat_Syn { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Pat_WS { boolean }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/quickcheck.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/quickcheck.xml
new file mode 100644
index 000000000..224c2287e
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/quickcheck.xml
@@ -0,0 +1,31 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="quick check properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute NFC_QC { "Y" | "N" | "M" }?
+
+  code-point-attributes &amp;=
+    attribute NFD_QC { "Y" | "N" }?
+
+  code-point-attributes &amp;=
+    attribute NFKC_QC { "Y" | "N" | "M" }?
+
+  code-point-attributes &amp;=
+    attribute NFKD_QC { "Y" | "N" }?
+
+
+  code-point-attributes &amp;=
+    attribute XO_NFC { boolean }?
+
+  code-point-attributes &amp;=
+    attribute XO_NFD { boolean }?
+
+  code-point-attributes &amp;=
+    attribute XO_NFKC { boolean }?
+
+  code-point-attributes &amp;=
+    attribute XO_NFKD { boolean }?
+
+
+  code-point-attributes &amp;=
+    attribute FC_NFKC { "#" | one-or-more-code-points }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/repertoire.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/repertoire.xml
new file mode 100644
index 000000000..0cfc86e40
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/repertoire.xml
@@ -0,0 +1,6 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="repertoire" id='schema.repertoire'>
+  ucd.content &amp;=
+    element repertoire { (code-point | group) + }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/repertoire_Code_points.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/repertoire_Code_points.xml
new file mode 100644
index 000000000..cdfd1ad88
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/repertoire_Code_points.xml
@@ -0,0 +1,23 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="Code points" id='schema.repertoire'>
+  code-point |=
+    element reserved {
+      set-of-code-points,
+      code-point-attributes }
+
+  code-point |=
+    element noncharacter {
+      set-of-code-points,
+      code-point-attributes }
+
+  code-point |=
+    element surrogate {
+      set-of-code-points,
+      code-point-attributes }
+
+  code-point |=
+    element char {
+      set-of-code-points,
+      code-point-attributes }
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/script.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/script.xml
new file mode 100644
index 000000000..b22243aaf
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/script.xml
@@ -0,0 +1,49 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="script properties" id='schema.properties'>
+  script = "Adlm" | "Aghb" | "Ahom" | "Arab" | "Armi" | "Armn"
+           | "Avst"
+           | "Bali" | "Bamu" | "Bass" | "Batk" | "Beng" | "Bhks"
+           | "Bopo" | "Brah" | "Brai" | "Bugi" | "Buhd"
+           | "Cakm" | "Cans" | "Cari" | "Cham" | "Cher" | "Chrs"
+           | "Copt" | "Cpmn" | "Cprt" | "Cyrl"
+           | "Deva" | "Diak" | "Dogr" | "Dsrt" | "Dupl"
+           | "Egyp" | "Elba" | "Elym" | "Ethi"
+           | "Gara" | "Geor" | "Glag" | "Gong" | "Gonm" | "Goth"
+           | "Gran" | "Grek" | "Gujr" | "Gukh" | "Guru"
+           | "Hang" | "Hani" | "Hano" | "Hatr" | "Hebr" | "Hira"
+           | "Hluw" | "Hmng" | "Hmnp" | "Hrkt" | "Hung"
+           | "Ital"
+           | "Java"
+           | "Kali" | "Kana" | "Kawi" | "Khar" | "Khmr" | "Khoj"
+           | "Kits" | "Knda" | "Krai" | "Kthi"
+           | "Lana" | "Laoo" | "Latn" | "Lepc" | "Limb" | "Lina"
+           | "Linb" | "Lisu" | "Lyci" | "Lydi"
+           | "Mahj" | "Maka" | "Mand" | "Mani" | "Marc" | "Medf"
+           | "Mend" | "Merc" | "Mero" | "Mlym" | "Modi" | "Mong"
+           | "Mroo" | "Mtei" | "Mult" | "Mymr"
+           | "Nagm" | "Nand" | "Narb" | "Nbat" | "Newa" | "Nkoo"
+           | "Nshu"
+           | "Ogam" | "Olck" | "Onao" | "Orkh" | "Orya" | "Osge"
+           | "Osma" | "Ougr"
+           | "Palm" | "Pauc" | "Perm" | "Phag" | "Phli" | "Phlp"
+           | "Phnx" | "Plrd" | "Prti"
+           | "Rjng" | "Rohg" | "Runr"
+           | "Samr" | "Sarb" | "Saur" | "Sgnw" | "Shaw" | "Shrd"
+           | "Sidd" | "Sind" | "Sinh" | "Sogd" | "Sogo" | "Sora"
+           | "Soyo" | "Sund" | "Sunu" | "Sylo" | "Syrc"
+           | "Tagb" | "Takr" | "Tale" | "Talu" | "Taml" | "Tang"
+           | "Tavt" | "Telu" | "Tfng" | "Tglg" | "Thaa" | "Thai"
+           | "Tibt" | "Tirh" | "Tnsa" | "Todr" | "Toto" | "Tutg"
+           | "Ugar"
+           | "Vaii" | "Vith"
+           | "Wara" | "Wcho"
+           | "Xpeo" | "Xsux"
+           | "Yezi" | "Yiii"
+           | "Zanb" | "Zinh" | "Zyyy" | "Zzzz"
+
+  code-point-attributes &amp;=
+    attribute sc { script }?
+
+  code-point-attributes &amp;=
+    attribute scx { list { script + } }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/simple_case_mapping.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/simple_case_mapping.xml
new file mode 100644
index 000000000..e2acb669c
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/simple_case_mapping.xml
@@ -0,0 +1,11 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="casing properties" id='schema.properties'>
+  code-point-attributes &amp;=
+    attribute suc { "#" | single-code-point }?
+
+  code-point-attributes &amp;=
+    attribute slc { "#" | single-code-point }?
+
+  code-point-attributes &amp;=
+    attribute stc { "#" | single-code-point }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/standardized-variants.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/standardized-variants.xml
new file mode 100644
index 000000000..a415a1152
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/standardized-variants.xml
@@ -0,0 +1,10 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="standardized variants" id='schema.standardized-variants'>
+  ucd.content &amp;=
+    element standardized-variants {
+      element standardized-variant {
+        attribute cps { two-code-points },
+        attribute desc { text },
+        attribute when { text } }+ }?
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/fragments/start.xml b/unicodetools/src/main/resources/org/unicode/uax42/fragments/start.xml
new file mode 100644
index 000000000..ba0e2262f
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/fragments/start.xml
@@ -0,0 +1,6 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--Manual-->
+<ucdxml:block xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml" title="schema start" id='schema.start'>
+  start =
+    element ucd { ucd.content }
+</ucdxml:block>
\ No newline at end of file
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/index.xml b/unicodetools/src/main/resources/org/unicode/uax42/index.xml
new file mode 100644
index 000000000..c0f05f5c2
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/index.xml
@@ -0,0 +1,1353 @@
+<?xml version='1.0' encoding='UTF-8'?>
+
+<article xmlns:unicode="http://unicode.org/ns/2001"
+         xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml"
+         xmlns:xi="http://www.w3.org/2001/XInclude"
+>
+
+    <title>Unicode Character Database in XML</title>
+
+    <articleinfo>
+        <unicode:tr number='42' class='uax' version='16.0.0'
+                    stage='proposed-update'
+                    schema='rnc' prevrev='34'/>
+        <copyright>
+            <year>2025</year>
+        </copyright>
+        <authors>
+            <author>
+                <surname>Wilcock</surname>
+                <firstname>John</firstname>
+            </author>
+        </authors>
+        <revhistory>
+            <revision revnumber="36" date="2024-09-02">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>16.0</val>.
+                    </change>
+                    <change>New values for the <attr>blk</attr> attribute: <val>Egyptian_Hieroglyphs_Ext_A</val>, <val>
+                        Garay</val>, <val>Gurung_Khema</val>, <val>Kirat_Rai</val>, <val>Myanmar_Ext_C</val>, <val>
+                        Ol_Onal</val>, <val>Sunuwar</val>, <val>Symbols_for_Legacy_Computing_Sup</val>, <val>
+                        Todhri</val>, <val>Tulu_Tigalari</val>.
+                    </change>
+                    <change>New values for the <attr>script</attr> attribute: <val>Gara</val>, <val>Gukh</val>, <val>
+                        Krai</val>, <val>Onao</val>, <val>Sunu</val>, <val>Todr</val>, <val>Tutg</val>.
+                    </change>
+                    <change>New value for the <attr>jg</attr> attribute: <val>Kashmiri_Yeh</val>.</change>
+                    <change>New value for the <attr>InSC</attr> attribute: <val>Reordering_Killer</val>.
+                    </change>
+                    <change>New attributes: <attr>MCM</attr>, <attr>kFanqie</attr>, <attr>kZhuang</attr>.
+                    </change>
+                    <change>Modified patterns for the <attr>cjk-radical/@number</attr>, <attr>kRSUnicode</attr> and <attr>
+                        kIRG_GSource
+                    </attr> attributes.
+                    </change>
+                    <change>Added the <elem>do-not-emit</elem> element.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 35 being a proposed update, only changes between revisions 34 and 36 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="34" date="2023-08-27">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>15.1</val>.
+                    </change>
+                    <change>New value for the <attr>blk</attr> attribute: <val>CJK_Ext_I</val>.
+                    </change>
+                    <change>New values for the <attr>lb</attr> attribute: <val>AK</val>, <val>AP</val>, <val>
+                        AS</val>, <val>VF</val>, <val>VI</val>.
+                    </change>
+                    <change>Modified values for the <attr>number</attr>, <attr>radical</attr> attributes of the <elem>
+                        cjk-radical
+                    </elem> element.
+                    </change>
+                    <change>Changed single value into list for the <attr>nv</attr> code point attribute.
+                    </change>
+                    <change>New code point attributes: <attr>ID_Compat_Math_Continue</attr>, <attr>
+                        ID_Compat_Math_Start</attr>, <attr>IDSU</attr>, <attr>NFKC_SCF</attr>, <attr>InCB</attr>.
+                    </change>
+                    <change>Modified patterns for the <attr>kBigFive</attr>, <attr>kIRG_GSource</attr>, <attr>
+                        kMorohashi</attr>, <attr>kRSUnicode</attr> attributes.
+                    </change>
+                    <change>Changed single values into lists for the <attr>kMorohashi</attr>, <attr>kPrimaryNumeric
+                    </attr> Unihan attributes.
+                    </change>
+                    <change>New Unihan attributes: <attr>kJapanese</attr>, <attr>kMojiJoho</attr>, <attr>
+                        kSMSZD2003Index</attr>, <attr>kSMSZD2003Readings</attr>, <attr>kVietnameseNumeric</attr>, <attr>
+                        kZhuangNumeric</attr>.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 33 being a proposed update, only changes between revisions 32 and 34 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="32" date="2022-09-04">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>15.0</val>.
+                    </change>
+                    <change>New values for the <attr>blk</attr> attribute: <val>Arabic_Ext_C</val>, <val>CJK_Ext_H</val>, <val>
+                        Cyrillic_Ext_D</val>, <val>Devanagari_Ext_A</val>, <val>Kaktovik_Numerals</val>, <val>Kawi</val>, <val>
+                        Nag_Mundari</val>.
+                    </change>
+                    <change>New values for the <attr>script</attr> attribute: <val>Kawi</val>, <val>Nagm</val>.
+                    </change>
+                    <change>New Unihan attribute: <val>kAlternateTotalStrokes</val>.
+                    </change>
+                    <change>Modified patterns for the <attr>kIRG_GSource</attr>, <attr>kIRG_HSource</attr>, <attr>
+                        kIRG_TSource</attr>, <attr>kSemanticVariant</attr>, <attr>kSpecializedSemanticVariant</attr>, <attr>
+                        kZVariant
+                    </attr> attributes.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 31 being a proposed update, only changes between revisions 30 and 32 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="30" date="2021-08-12">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>14.0</val>.
+                    </change>
+                    <change>New values for the <attr>blk</attr> attribute: <val>Arabic_Ext_B</val>, <val>
+                        Cypro_Minoan</val>, <val>Ethiopic_Ext_B</val>, <val>Kana_Ext_B</val>, <val>
+                        Latin_Ext_F</val>, <val>Latin_Ext_G</val>, <val>Old_Uyghur</val>, <val>Tangsa</val>, <val>
+                        Toto</val>, <val>UCAS_Ext_A</val>, <val>Vithkuqi</val>, <val>Znamenny_Music</val>.
+                    </change>
+                    <change>New values for the <attr>script</attr> attribute: <val>Cpmn</val>, <val>Ougr</val>, <val>
+                        Tnsa</val>, <val>Toto</val>, <val>Vith</val>.
+                    </change>
+                    <change>New values for the <attr>jg</attr> attribute: <val>Thin_Yeh</val>, <val>Vertical_Tail</val>.
+                    </change>
+                    <change>New Unihan attribute: <val>kStrange</val>.
+                    </change>
+                    <change>Modified patterns for the <attr>kIRG_GSource</attr>, <attr>kIRG_MSource</attr>, <attr>
+                        kIRG_VSource</attr>, <attr>kPhonetic</attr>, <attr>kSpoofingVariant</attr> attributes.
+                    </change>
+                    <change>Removal of the <attr>kWubi</attr> attribute, which has never been present in
+                        released versions of the UCD.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 29 being a proposed update, only changes between revisions 28 and 30 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="28" date="2020-02-21">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>13.0</val>.
+                    </change>
+                    <change>New values for the <attr>blk</attr> attribute: <val>Chorasmian</val>, <val>CJK_Ext_G</val>, <val>
+                        Dives_Akuru</val>, <val>Khitan_Small_Script</val>, <val>Lisu_Sup</val>, <val>
+                        Symbols_For_Legacy_Computing</val>, <val>Tangut_Sup</val>, <val>Yezidi</val>.
+                    </change>
+                    <change>New values for the <attr>script</attr> attribute: <val>Chrs</val>, <val>Diak</val>, <val>
+                        Kits</val>, <val>Yezi</val>.
+                    </change>
+                    <change>New value for the <attr>InPC</attr> attribute: <val>Top_And_Bottom_And_Left</val>.
+                    </change>
+                    <change>New Unihan attributes <attr>kSpoofingVariant</attr>, <attr>kUnihanCore2020</attr>, <attr>
+                        kIRG_SSource</attr>, <attr>kIRG_UKSource</attr>, <attr>kTGHZ2013</attr>.
+                    </change>
+                    <change>New Emoji attributes <attr>Emoji</attr>, <attr>EPres</attr>, <attr>EMod</attr>, <attr>
+                        EBase</attr>, <attr>EComp</attr>, <attr>ExtPict</attr>.
+                    </change>
+                    <change>Modified patterns for the <attr>kIRG_GSource</attr>, <attr>kIRG_HSource</attr>, <attr>
+                        kIRG_KPSource</attr>, <attr>kIRG_KSource</attr>, <attr>kIRG_TSource</attr>, <attr>kKangXi</attr>, <attr>
+                        kSemanticVariant</attr>, <attr>kSimplifiedVariant</attr>, <attr>
+                        kSpecializedSemanticVariant</attr>, <attr>kTraditionalVariant</attr> attributes.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 27 being a proposed update, only changes between revisions 26 and 28 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="26" date="2019-05-06">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>12.1</val>.
+                    </change>
+                </changes>
+            </revision>
+            <revision revnumber="25" date="2019-02-18">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>12.0</val>.
+                    </change>
+                    <change>New values for the <attr>script</attr> attribute: <val>Elym</val>, <val>Hmnp</val>, <val>
+                        Nand</val>, <val>Wcho</val>.
+                    </change>
+                    <change>New values for the <attr>blk</attr> attribute: <val>
+                        Egyptian_Hieroglyph_Format_Controls</val>, <val>Elymaic</val>, <val>Nandinagari</val>, <val>
+                        Nyiakeng_Puachue_Hmong</val>, <val>Ottoman_Siyaq_Numbers</val>, <val>Small_Kana_Ext</val>, <val>
+                        Symbols_And_Pictographs_Ext_A</val>, <val>Tamil_Sup</val>, <val>Wancho</val>.
+                    </change>
+                    <change>Modified patterns for the <attr>kIRG_GSource</attr>, <attr>kIRG_KSource</attr>, <attr>
+                        kIRG_TSource</attr>, <attr>kTaiwanTelegraph</attr> attributes.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 24 being a proposed update, only changes between revisions 23 and 25 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="23" date="2018-05-31">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>11.0</val>.
+                    </change>
+                    <change>New values for the <attr>blk</attr> attribute: <val>Chess_Symbols</val>, <val>
+                        Dogra</val>, <val>Georgian_Ext</val>, <val>Gunjala_Gondi</val>, <val>
+                        Hanifi_Rohingya</val>, <val>Indic_Siyaq_Numbers</val>, <val>Makasar</val>, <val>
+                        Mayan_Numerals</val>, <val>Medefaidrin</val>, <val>Old_Sogdian</val>, <val>Sogdian</val>.
+                    </change>
+                    <change>New values for the <attr>script</attr> attribute: <val>Dogr</val>, <val>Gong</val>, <val>
+                        Maka</val>, <val>Medf</val>, <val>Rohg</val>, <val>Sogd</val>, <val>Sogo</val>.
+                    </change>
+                    <change>New values for the <attr>jg</attr> attribute: <val>Hanifi_Rohingya_Kinna_Ya</val>, <val>
+                        Hanifi_Rohingya_Pa</val>.
+                    </change>
+                    <change>New value for the <attr>wb</attr> attribute: <val>WSegSpace</val>.
+                    </change>
+                    <change>New value for the <attr>InSC</attr> attribute: <val>Consonant_Initial_Postfixed</val>.
+                    </change>
+                    <change>New attributes: <attr>EqUIdeo</attr>, <attr>kJinmeiyoKanji</attr>, <attr>kJoyoKanji</attr>, <attr>
+                        kKoreanEducationHanja</attr>, <attr>kKoreanName</attr>, <attr>kTGH</attr>.
+                    </change>
+                    <change>Modified patterns for the <attr>kTGT_MergedSrc</attr> attribute.
+                    </change>
+                    <change>Modified patterns for the <attr>kIRG_GSource</attr>, <attr>kIRG_HSource</attr> and <attr>
+                        kIRG_VSource
+                    </attr> attributes.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 22 being a proposed update, only changes between revisions 21 and 23 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="21" date="2017-06-17">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>10.0</val>.
+                    </change>
+                    <change>New values for the <attr>blk</attr> attribute: <val>CJK_Ext_F</val>, <val>Kana_Ext_A</val>, <val>
+                        Masaram_Gondi</val>, <val>Nushu</val>, <val>Soyombo</val>, <val>Syriac_Sup</val>, <val>
+                        Zanabazar_Square</val>.
+                    </change>
+                    <change>New values for the <attr>sc</attr> attribute: <val>Gonm</val>, <val>Nshu</val>, <val>
+                        Soyo</val>, <val>Zanb</val>.
+                    </change>
+                    <change>New values for the <attr>jg</attr> attribute: <val>Malayalam_Nga</val>, <val>
+                        Malayalam_Ja</val>, <val>Malayalam_Nya</val>, <val>Malayalam_Tta</val>, <val>Malayalam_Nna</val>, <val>
+                        Malayalam_Nnna</val>, <val>Malayalam_Bha</val>, <val>Malayalam_Ra</val>, <val>
+                        Malayalam_Lla</val>, <val>Malayalam_Llla</val>, <val>Malayalam_Ssa</val>.
+                    </change>
+                    <change>New value for the <attr>InPC</attr> attribute: <val>Bottom_And_Left</val>.
+                    </change>
+                    <change>Modified patterns for the <attr>kIRG_GSource</attr>, <attr>kIRG_JSource</attr>, <attr>
+                        kIRG_KSource
+                    </attr> attributes.
+                    </change>
+                    <change>New code point attributes: <attr>vo</attr>,
+                        <attr>RI</attr>
+                    </change>
+                    <change>New code point attributes for Nushu data: <attr>kSrc_NushuDuben</attr> and <attr>
+                        kReading</attr>.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 20 being a proposed update, only changes between revisions 19 and 21 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="19" date="2016-05-30">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>9.0</val>.
+                    </change>
+                    <change>New values for the <attr>sc</attr> attribute: <val>Adlm</val>, <val>Bhks</val>, <val>
+                        Marc</val>, <val>Newa</val>, <val>Osge</val>, <val>Tang</val>.
+                    </change>
+                    <change>New values for the <attr>blk</attr> attribute: <val>Adlam</val>, <val>Bhaiksuki</val>, <val>
+                        Cyrillic_Ext_C</val>, <val>Glagolitic_Sup</val>, <val>Ideographic_Symbols</val>, <val>
+                        Marchen</val>, <val>Mongolian_Sup</val>, <val>Newa</val>, <val>Osage</val>, <val>
+                        Tangut</val>, <val>Tangut_Components</val>.
+                    </change>
+                    <change>New values for the <attr>gcb</attr> attribute: <val>EB</val>, <val>EBG</val>, <val>EM</val>, <val>
+                        GAZ</val>, <val>ZWJ</val>.
+                    </change>
+                    <change>New values for the <attr>wb</attr> attribute: <val>EB</val>, <val>EBG</val>, <val>EM</val>, <val>
+                        GAZ</val>, <val>ZWJ</val>.
+                    </change>
+                    <change>New values for the <attr>lb</attr> attribute: <val>EB</val>, <val>EM</val>, <val>ZWJ</val>.
+                    </change>
+                    <change>New values for the <attr>jg</attr> attribute: <val>African_Feh</val>, <val>
+                        African_Noon</val>, <val>African_Qaf</val>.
+                    </change>
+                    <change>New code point attributes: <attr>PCM</attr>, <attr>kRSTUnicode</attr> and <attr>
+                        kTGT_MergedSrc</attr>.
+                    </change>
+                    <change>Modified patterns for the <attr>kRSUnicode</attr>, <attr>kRSKangXi</attr>, <attr>
+                        kMandarin</attr>, <attr>kIRG_JSource</attr>, <attr>kIRG_USource</attr> and <attr>kFennIndex
+                    </attr> attributes.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 18 being a proposed update, only changes between revisions 17 and 19 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="17" date="2015-05-29">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>8.0</val>.
+                    </change>
+                    <change>New values for the <attr>sc</attr> attribute: <val>Ahom</val>, <val>Hatr</val>, <val>
+                        Hluw</val>, <val>Hung</val>, <val>Mult</val>, <val>Sgnw</val>.
+                    </change>
+                    <change>New values for the <attr>blk</attr> attribute: <val>Ahom</val>, <val>
+                        Anatolian_Hieroglyphs</val>, <val>Cherokee_Sup</val>, <val>CJK_Ext_E</val>, <val>
+                        Early_Dynastic_Cuneiform</val>, <val>Hatran</val>, <val>Multani</val>, <val>Old_Hungarian</val>, <val>
+                        Sup_Symbols_And_Pictographs</val>, <val>Sutton_SignWriting</val>.
+                    </change>
+                    <change>New values for the <attr>InSC</attr> attribute: <val>Consonant_Killer</val>, <val>
+                        Consonant_Prefixed</val>, <val>Consonant_With_Stacker</val>, <val>Syllable_Modifier</val>.
+                    </change>
+                    <change>New code point attributes: <attr>InPC</attr>, <attr>kJa</attr>.
+                    </change>
+                    <change>New patterns for the <attr>kIRG_GSource</attr> attribute: <val>GFC-</val>, <val>GGFZ-</val>.
+                    </change>
+                    <change>Switched the reference to ISO 19757 from :2003 and :2003 Amd1 to :2008.</change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 16 being a proposed update, only changes between revisions 15 and 17 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="15" date="2014-05-29">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>7.0</val>.
+                    </change>
+                    <change>New values for the <attr>jg</attr> attribute.
+                    </change>
+                    <change>New values for the <attr>sc</attr> attribute.
+                    </change>
+                    <change>New values for the <attr>blk</attr> attribute.
+                    </change>
+                    <change>New values for the <attr>InSC</attr> attribute.
+                    </change>
+                    <change>New values for the <attr>kIICore</attr> attribute.
+                    </change>
+                    <change>New values for the <attr>kIRG_GSource</attr> attribute.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 14 being a proposed update, only changes between revisions 13 and 15 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="13" date="2013-08-09">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>6.3</val>.
+                    </change>
+                    <change>New values <val>DQ</val>, <val>HL</val>, <val>SQ</val> for the <attr>WB</attr> attribute (for Unicode 6.3).
+                    </change>
+                    <change>New code point attributes <attr>bpt</attr> and <attr>bpb</attr> (for Unicode 6.3).
+                    </change>
+                    <change>New values for the <attr>bc</attr> attribute: <val>LRI</val>, <val>RLI</val>, <val>FSI</val>, <val>
+                        PDI
+                    </val> (for Unicode 6.3).
+                    </change>
+                    <change>Updated the patterns for <attr>kHanyuPinlu</attr> and <attr>kTotalStrokes</attr> (for
+                        Unicode 6.3).
+                    </change>
+                    <change>Updated the patterns for <attr>kIRG_HSource</attr> and <attr>kIRG_HSource</attr> (for
+                        Unicode 6.2).
+                    </change>
+                    <change>Clarified that the child elements of list-like elements are in no particular order.</change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 12 being a proposed update, only changes between revisions 11 and 13 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="11" date="2012-09-17">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>6.2</val>.
+                    </change>
+                    <change>New value for the <attr>gcb</attr>, <attr>wb</attr> and <attr>lb</attr> attributes: <val>
+                        RI
+                    </val> (for Unicode 6.2).
+                    </change>
+                    <change>Updated the patterns for <attr>kIRG_GSource</attr> and <attr>kIRG_HSource</attr> (for
+                        Unicode 6.2).
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 10 being a proposed update, only changes between revisions 9 and 11 are
+                noted here.
+            </proposed_update>
+            <revision revnumber="9" date="2012-01-25">
+                <changes>
+                    <change>Clarified the default values.</change>
+                    <change>Indicate that property values may change from one release to the next.</change>
+                    <change>Introduced the <attr>blk</attr> attributes, for the <prop>Block</prop> property.
+                    </change>
+                    <change>Introduced the <attr>scx</attr> attribute, for the <prop>ScriptExtensions</prop> property.
+                    </change>
+                    <change>Introduced the <elem>name-alias</elem> element, for the <prop>Name_Alias</prop> property.
+                    </change>
+                    <change>New value for the <attr>age</attr> attribute: <val>6.1</val>.
+                    </change>
+                    <change>New values for the <attr>script</attr> attribute: <val>Cakm</val>, <val>Merc</val>, <val>
+                        Mero</val>, <val>Plrd</val>, <val>Shrd</val>, <val>Sora</val>, <val>Takr</val>.
+                    </change>
+                    <change>New values for the <attr>lb</attr> attribute: <val>HL</val> and <val>CJ</val>.
+                    </change>
+                    <change>New value for the <attr>jg</attr> attribute: <val>Rohingya_Yeh</val>.
+                    </change>
+                    <change>The value of the <attr>fc_nfkc</attr> attribute must now be either # or <val>
+                        one-or-more-code-points</val>.
+                    </change>
+                    <change>For the <attr>nv</attr> attribute, the absence of a numeric value is now represented by <val>
+                        NaN
+                    </val> rather than by the empty string.
+                    </change>
+                    <change>The values of the <tattrt>ccc</tattrt> are now restricted to 0..254, instead of 0..255.
+                    </change>
+                    <change>Updated the patterns for <attr>kSemanticVariant</attr>, <attr>
+                        kSpecializedSemanticVariant</attr>, <attr>kIRG_USource</attr>, and <attr>kMandarin</attr>.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 8 being a proposed update, only changes between revisions 7 and 9 are noted
+                here.
+            </proposed_update>
+            <revision revnumber="7" date="2010-10-08">
+                <changes>
+                    <change>New value for the <attr>age</attr> attribute: <val>6.0</val>.
+                    </change>
+                    <change>New value for the <attr>jg</attr> attribute:
+                        <val>Teh_Marbuta_Goal</val>
+                    </change>
+                    <change>New values for the <attr>script</attr> attribute: <val>Batk</val>, <val>Brah</val>, <val>
+                        Mand</val>.
+                    </change>
+                    <change>Updated the patterns for <attr>kIRG_GSource</attr>, <attr>kIRG_HSource</attr>, <attr>
+                        kIRG_JSource</attr>, <attr>kIRG_KSource</attr>, <attr>kIRG_MSource</attr>, <attr>
+                        kIRG_TSource</attr>, <attr>kIRG_VSource</attr>.
+                    </change>
+                    <change>Added the <elem>InSC</elem> and <elem>InMC</elem> elements.
+                    </change>
+                    <change>Added the <elem>emoji-sources</elem> element.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 6 being a proposed update, only changes between revisions 5 and 7 are noted
+                here.
+            </proposed_update>
+            <revision revnumber="5" date="2009-09-17">
+                <changes>
+                    <change>Changed the type of <attr>block/@first-cp</attr>, <attr>block/@last-cp</attr> and <attr>
+                        normalization-corrections/@cp
+                    </attr> from <val>text</val> to
+                        <val>single-code-point</val>
+                    </change>
+                    <change>Changed the type of <attr>named-sequence/@cps</attr>, <attr>
+                        provisional-named-sequences/@cps</attr>, <attr>normalization-correction/@old</attr> and <attr>
+                        normalization-correction/@new
+                    </attr> from <val>text</val> to <val>one-or-more-code-points</val>.
+                    </change>
+                    <change>Changed the type of <attr>standardized-variants/@cps</attr> from <val>text</val> to <val>
+                        two-code-points</val>.
+                    </change>
+                    <change>New values for the <attr>jg</attr> attribute: <val>Farsi_Yeh</val> and <val>Nya</val>.
+                    </change>
+                    <change>New value for the <attr>age</attr> attribute: <val>5.2</val>.
+                    </change>
+                    <change>New values for the <attr>sc</attr> attribute: <val>Lana</val>, <val>Tavt</val>, <val>
+                        Avst</val>, <val>Egyp</val>, <val>Samr</val>, <val>Lisu</val>, <val>Bamu</val>, <val>Java</val>, <val>
+                        Mtei</val>, <val>Armi</val>, <val>Sarb</val>, <val>Prti</val>, <val>Phli</val>, <val>Orkh</val>, <val>
+                        Kthi</val>.
+                    </change>
+                    <change>New value for the <attr>lb</attr> attribute: <val>CP</val>.
+                    </change>
+                    <change>New value for the <attr>sc</attr> attribute: <val>Zinh</val>.
+                    </change>
+                    <change>New code point attributes <tattrt>CI</tattrt>, <attr>Cased</attr>, <attr>CWCF</attr>, <attr>
+                        CWCM</attr>, <attr>CWL</attr>, <attr>CWKCF</attr>, <attr>CWT</attr>, <attr>CWU</attr>, <attr>
+                        NFKC_CF</attr>.
+                    </change>
+                    <change>New attributes <attr>kHanyuPinyin</attr> and <attr>kIRG_MSource</attr>.
+                    </change>
+                    <change>New element
+                        <elem>cjk-radicals</elem>
+                    </change>
+                    <change>Updated the patterns for <attr>kIRG_GSource</attr>, <attr>kIRG_JSource</attr>, <attr>
+                        kIRG_KPSource</attr>, <attr>kIRG_KSource</attr>, <attr>kIRG_TSource</attr>, <attr>
+                        kIRG_VSource</attr>, <attr>kHanyuPinlu</attr>, <attr>kMandarin</attr>, <attr>
+                        kSemanticVariant</attr>, <attr>kSpecializedSemanticVariant</attr>, <attr>
+                        kVietnamese</attr>, <attr>kZVariant</attr>.
+                    </change>
+                    <change>Point out that Relax NG schemas do not modify or augment the infoset, and that it is possible
+                        to convert mechanically our schema to other schema languages.
+                    </change>
+                </changes>
+            </revision>
+            <proposed_update>Revision 4 being a proposed update, only changes between revisions 3 and 5 are noted
+                here.
+            </proposed_update>
+            <revision revnumber="3" date="2008-04-01">
+                <changes>
+                    <change>First approved version, for Unicode 5.1.0.</change>
+                    <change>For optional elements which act as collections, such as <elem>repertoire</elem> and <elem>
+                        named-sequences</elem>, impose that there be at least one element in the collection.
+                    </change>
+                    <change>Remove the constraint that the value <attr>jg</attr> is limited when <attr>jt</attr> has
+                        certain values; similarly for <attr>bmg</attr> / <attr>Bidi_M</attr> and for <attr>nv</attr> /
+                        <attr>nt</attr>.
+                    </change>
+                    <change>Value <val>NL</val> added to the <attr>WB</attr> attribute (for Unicode 5.1).
+                    </change>
+                    <change>Value <val>PP</val> added to the <attr>GCB</attr> attribute (for Unicode 5.1).
+                    </change>
+                    <change>Corrected the <val>Vai</val> script value to <val>Vaii</val>.
+                    </change>
+                    <change>Removed the discussion of elements or attributes in different namespace.</change>
+                    <change>Removed the <elem>code-point</elem> element.
+                    </change>
+                </changes>
+            </revision>
+            <revision revnumber="2" date="2007-12-14">
+                <changes>
+                    <change>Promoted to Draft UAX.</change>
+                    <change>Changed the title from "An XML representation of the UCD"</change>
+                    <change>Value <val>5.1</val> added to the <attr>age</attr> attribute (for Unicode 5.1).
+                    </change>
+                    <change>Value <val>SM</val> added to the <attr>gcb</attr> attribute (for Unicode 5.1).
+                    </change>
+                    <change>Values <val>CR</val>, <val>Extend</val>, <val>LF</val>, <val>MB</val> added to the <attr>
+                        WB
+                    </attr> attribute (for Unicode 5.1).
+                    </change>
+                    <change>Values <val>CR</val>, <val>EX</val>, <val>LF</val>, <val>SC</val> added to the <attr>SB
+                    </attr> attribute (for Unicode 5.1).
+                    </change>
+                    <change>Value <val>Burushaski_Yeh_Barree</val> added to the <attr>jg</attr> attribute (for
+                        Unicode 5.1).
+                    </change>
+                    <change>Value <val>Alef_Maqsurah</val> added to the <attr>jg</attr> attribute (for Unicode 2.x).
+                    </change>
+                    <change>Values <val>Cari</val>, <val>Cham</val>, <val>Kali</val>, <val>Lepc</val>, <val>
+                        Lyci</val>, <val>Lydi</val>, <val>Olck</val>, <val>Rjng</val>, <val>Saur</val>, <val>Sund</val> and <val>
+                        Vai
+                    </val> added to the <attr>sc</attr> attribute (for Unicode 5.0).
+                    </change>
+                    <change>
+                        <attr>jamo</attr>
+                        attribute renamed to
+                        <attr>JSN</attr>
+                    </change>
+                    <change>
+                        <attr>sfc</attr>
+                        attribute renamed to
+                        <attr>scf</attr>
+                    </change>
+                    <change>Attribute <attr>kXHC1983</attr> added (for Unicode 5.1.0).
+                    </change>
+                    <change>Pattern for attribute <attr>kIRG_USource</attr> extended (for Unicode 5.1.0).
+                    </change>
+                    <change>Element <elem>provisional-named-sequences</elem> added (for Unicode 5.0)
+                    </change>
+                </changes>
+            </revision>
+            <revision revnumber="1" date="2007-04-21">
+                <changes>
+                    <change>First working draft.</change>
+                </changes>
+            </revision>
+        </revhistory>
+    </articleinfo>
+
+    <abstract>
+        <para>This annex describes an XML representation of the Unicode Character Database.</para>
+    </abstract>
+
+
+    <!--========================================================================-->
+    <section>
+        <title>Introduction</title>
+        <para>In working on Unicode implementations, it is often useful to access the full content of the Unicode
+            Character Database (UCD). For example, in establishing mappings from characters to glyphs in fonts, it is
+            convenient to see the character scalar value, the character name, the character East Asian width, along with
+            the shape and metrics of the proposed glyph to map to; looking at all this data simultaneously helps in
+            evaluating the mapping.
+        </para>
+        <para>Directly accessing the data files that constitute the UCD is sometimes a daunting proposition. The data is
+            dispersed in a number of files of various formats, and there are just enough peculiarities (all justified by
+            the processing power available at the time the UCD representation was designed) to require a fairly intimate
+            knowledge of the data format itself, in addition to the meaning of the data.
+        </para>
+        <para>Many programming environments (for example, Java or ICU) do give access to the UCD. However, those
+            environments tend to lag behind releases of the standard, or support only some of the UCD content.
+        </para>
+        <para>Unibook is a wonderful tool to explore the UCD and in many cases is just the ticket; however, it is
+            difficult to use when the task at hand has not been built-in, or when non-UCD data is to be displayed as
+            well.
+        </para>
+        <para>This annex presents an alternative representation of the UCD, which is meant to overcome these
+            difficulties. We have chosen an XML representation, because parsing becomes a non-issue: there are a number
+            of XML parsers freely available, and using them is often fairly easy. In addition, there are freely
+            available tools that can perform powerful operations on XML data; for example, XPATH and XQUERY engines can
+            be thought of as a &#x201C;grep&#x201D; for XML data and XSLT engines can be thought of as
+            &#x201C;awk&#x201D; for XML data.
+        </para>
+        <para>It is important to note that we are interested in exploring the content of the UCD, rather than in using
+            the UCD data to process character streams. Thus, we are not concerned so much by the speed of processing or
+            the size of our representation.
+        </para>
+        <para>Our representation supports the creation of documents that represent only parts of the UCD, either by not
+            representing all the characters, or by not representing all the properties. This can be useful when only
+            some of the data is needed.
+        </para>
+        <para>This annex presents only the XML representation format of the UCD. The data itself is part of the <ulink
+                url='https://www.unicode.org/reports/tr41/tr41-34.html#UCD'>Unicode
+            Character Database</ulink>.
+        </para>
+    </section>
+
+
+    <!--========================================================================-->
+    <section>
+        <title>Overall schema</title>
+        <!--______________________________________________________________________-->
+        <section>
+            <title>General principles</title>
+            <para>Our schema can be used to create and validate documents which are intended to represent properties of
+                Unicode code points, blocks, named sequences, normalization corrections, standardized variants, CJK
+                radicals and emoji sources. A document may represent the values actually assigned in a given version of
+                the UCD, or it may represent a draft version of the UCD, or a private agreement on Private Use
+                characters. The validity of an XML document with respect to the schema defined in this annex does not
+                assert anything about the correctness of the values.
+            </para>
+            <para>Valid documents may provide values for only some of the code points, or some of the Unicode
+                properties. Furthermore, they may also incorporate non-Unicode properties.
+            </para>
+            <para>Our schema is defined using English. However, a useful subset of the validity constraints can be
+                captured using a schema language, thereby simplifying the task of validating documents. We have chosen
+                Relax NG [<ulink url='https://www.unicode.org/reports/tr41/tr41-34.html#ISO19757'>ISO 19757</ulink>],
+                in the compact syntax, as the schema language. It is important to stress that the schema which is
+                defined in English imposes more constraints on the documents than can be validated with the Relax NG
+                schema.
+            </para>
+            <para>An important characteristic of Relax NG is that its schemas do not modify or augment the infoset of
+                the documents. Therefore, it is possible to process our XML representation without using the schema.
+                Also, the schema is relatively straightforward and can be converted mechanically to other schema
+                languages.
+            </para>
+            <para>While our XML representation is not intended to be used during processing of characters and strings,
+                it is still a design principle for our schema to support the relatively efficient representation of the
+                UCD. This is achieved by an inheritance mechanism, similar to property inheritance in CSS or in XSL:FO
+                (see section <link linkend='group'>4.3 Group</link>).
+            </para>
+            <para>Many invariants impose constraints on the values of the different properties for a given code point.
+                For example, if the value of the <prop>Numeric Type</prop> property is None, then the value of the
+                <prop>Numeric Value</prop> property should be the empty string; and if the value of the <prop>Other
+                Alphabetic</prop> property is true, then the value of the <prop>Alphabetic</prop> property should be
+                true. Those invariants are not captured in the schema.
+            </para>
+        </section>
+
+        <!--______________________________________________________________________-->
+        <section>
+            <title>Namespace</title>
+            <para>The namespace for our elements is &#x201C;http://www.unicode.org/ns/2003/ucd/1.0&#x201D;. Our
+                attributes are in the empty namespace.
+            </para>
+            <!--Manual--><xi:include href="./fragments/namespace.xml"/>
+            <para>In all our examples, we assume that this namespace is the default one.
+            </para>
+        </section>
+
+        <!--______________________________________________________________________-->
+        <section>
+            <title>Datatypes</title>
+            <para>We use standard XML Schema datatypes:</para>
+            <!--Manual--><xi:include href="./fragments/datatypes.xml"/>
+            <para>Characters are pervasive in the UCD, and will need to be represented. Representing characters directly
+                by themselves would seem the most obvious choice; for example, we could express that the decomposition
+                of U+00E8 is &#x201c;&amp;#x0065;&amp;#x0300;&#x201d;, that is, have exactly two characters in (the
+                infoset of) the XML document. However, the current XML specification limits the set of characters
+                that can be part of a document. Another problem is that the various tools (XML parser, XPATH engine,
+                etc.) may equate U+00E8 with U+0065 U+0300, thus making it difficult to figure out which of the two
+                sequences is contained in the database (which is sometimes important for our purposes). Therefore, we
+                chose instead to represent characters by their code points; we follow the usual convention of four to
+                six hexadecimal digits (uppercase) and code points in a sequence separated by space; for example, the
+                decomposition of U+00E8 will be represented by the nine characters &#x201c;0065 0300&#x201d; in the
+                infoset.
+            </para>
+            <!--Manual--><xi:include href="./fragments/datatypes_code_points.xml"/>
+        </section>
+
+        <!--______________________________________________________________________-->
+        <section>
+            <title>Root Element</title>
+            <para>The root element of valid documents is a <elem>ucd</elem>.
+            </para>
+            <!--Manual--><xi:include href="./fragments/start.xml"/>
+        </section>
+
+        <!--______________________________________________________________________-->
+        <section>
+            <title>Common attributes</title>
+            <para>A large number of properties are boolean. We uniformly use the values <val>Y</val> and
+                <val>N</val> for those:
+            </para>
+            <xi:include href="./fragments/boolean.xml"/>
+        </section>
+
+        <!--______________________________________________________________________-->
+        <section>
+            <title>Ordering of elements</title>
+            <para>In elements that hold lists of child elements, such as <elem>repertoire</elem>,
+                <elem>group</elem>, or <elem>standardized-variants</elem>, the schema does not require that the
+                child elements be in any particular order.
+            </para>
+        </section>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>Description</title>
+        <para>The root element may have a <elem>description</elem> child element, which in turn contains any string,
+            which is meant to describe what the XML document purports to describe.
+        </para>
+        <para>It is recommended that if the document purports to represent the UCD of some Unicode version, the
+            <elem>description</elem> be selected in accord with the rules listed in <ulink
+                    url='https://www.unicode.org/reports/tr41/tr41-34.html#Versions'>[Versions]</ulink>; and
+            conversely, that documents which do not purport to represent the UCD be described as such.
+        </para>
+        <!--Manual--><xi:include href="./fragments/description.xml"/>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>Repertoire</title>
+        <para>The <elem>repertoire</elem> child element of the <elem>ucd</elem> element describes the code points and
+            their properties. As we will see shortly, code points can be described individually or as part of a group:
+        </para>
+        <!--Manual--><xi:include href="./fragments/repertoire.xml"/>
+
+        <!--______________________________________________________________________-->
+        <section>
+            <title>Sets of code points</title>
+            <para>It is often the case that successive code points have the same property values, for a given set of
+                properties. The most striking example is that of an unallocated plane, where all but the last two
+                code points are reserved and have the same property values. Another example is the URO (U+4E00
+                .. U+9FA5) where all the code points have the same property values if we ignore their name and their
+                Unihan properties.
+            </para>
+            <!--Manual--><xi:include href="./fragments/Set_of_code_points.xml"/>
+            <para>This observation suggests that it is profitable to represent sets of code points which share the
+                same properties, rather than individual code points. To make the representation of the sets simple,
+                we restrict them to be segments in the code point space, that is a set is defined by the first and
+                last code point it contains. Those are captured by the attributes <attr>first-cp</attr> and <attr>
+                    last-cp</attr>. The attribute <attr>cp</attr> is a shorthand notation for the case where the set
+                has a single code point.
+            </para>
+            <para>In the <elem>repertoire</elem>, there must be at most one <elem>code-point</elem>
+                element for a given code point.
+            </para>
+        </section>
+
+        <!--______________________________________________________________________-->
+        <section>
+            <title>Code point types</title>
+            <para>When thinking about Unicode code points, it is useful to split them into four types:
+            </para>
+            <itemizedlist>
+                <listitem>those assigned to abstract characters (PUA or not)</listitem>
+                <listitem>the noncharacters</listitem>
+                <listitem>the surrogate code points</listitem>
+                <listitem>the reserved code points</listitem>
+            </itemizedlist>
+            <para>This leads to four elements to describe sets of code points:
+            </para>
+            <!--Manual--><xi:include href="./fragments/repertoire_Code_points.xml"/>
+        </section>
+
+        <!--______________________________________________________________________-->
+        <section>
+            <title>Group</title>
+            <para>While we already recognized the situation where a set of code points have exactly the same set of
+                property values, another common situation is that of code points which have almost all the same
+                property values.
+            </para>
+            <para>For example, the characters U+1740 BUHID LETTER A .. U+1753 BUHID VOWEL SIGN U all have the age
+                &#x201C;3.2&#x201D;, and all have the script &#x201C;Buhd&#x201D;. On the one hand, it is convenient
+                to support data files in which those properties are explicitly listed with every code point, as this
+                makes answering questions like &#x201C;what is the age of U+1749?&#x201D; easier, because that data
+                is expressed right there. On the other hand, this leads to rather large data files, and it also tends
+                to obscure the differences between similar characters.
+            </para>
+
+            <para>Our representation accounts for this situation with the notion of groups. A
+                <elem>group</elem> element is simply a container of code points that also holds default values for
+                the properties. If a code point inside a <elem>group</elem> does not list explicitly a property but the
+                <elem>group</elem> lists it, then the code point inherits that property from its
+                <elem>group</elem>. For example, the fragment with explicit properties:
+            </para>
+            <codeblock>
+    &lt;char cp="1740" age="3.2" na="BUHID LETTER A" gc="Lo" sc="Buhd"/>
+    &lt;char cp="1741" age="3.2" na="BUHID LETTER I" gc="Lo" sc="Buhd"/>
+    &lt;char cp="1752" age="3.2" na="BUHID VOWEL SIGN I" gc="Mn" sc="Buhd"/>
+    &lt;char cp="1820" age="3.0" na="MONGOLIAN LETTER A" gc="Lo" sc="Mong"/></codeblock>
+            <para>is equivalent to this fragment which uses a <elem>group</elem>:
+            </para>
+            <codeblock>
+    &lt;group age="3.2" gc="Lo" sc="Buhd">
+        &lt;char cp="1740" na="BUHID LETTER A"/>
+        &lt;char cp="1741" na="BUHID LETTER I"/>
+        &lt;char cp="1752" na="BUHID VOWEL SIGN I" gc="Mn"/>
+        &lt;char cp="1820" age="3.0" na="MONGOLIAN LETTER A" sc="Mong"/>
+    &lt;/group></codeblock>
+            <para>The element for U+1740 does not have the <attr>age</attr> attribute, and it therefore inherits it
+                from its enclosing <elem>group</elem> element, that is &#x201C;3.2&#x201D;. On the other hand,
+                the element for U+1820 does have this attribute, so the value is &#x201C;3.0&#x201D;.
+            </para>
+            <para>As this example illustrates, the notion of <elem>group</elem> does not necessarily align with the
+                notion of Unicode block. It is entirely defined and limited to our representation. In particular, the
+                value of a property for a code point can always be determined from the XML document alone, assuming
+                that this property and this code point are expressed at all. Of course, one may create an XML
+                representation where the groups happen to coincide with the Unicode blocks.
+            </para>
+            <para>Groups cannot be nested. The motivation for this limitation is to make the life of consumers
+                easier: either a property is defined by the element for a code point, or it is defined by the
+                immediately enclosing <elem>group</elem> element.
+            </para>
+            <!--Manual--><xi:include href="./fragments/groups.xml"/>
+        </section>
+
+        <!--========================================================================-->
+        <section>
+            <title>Properties</title>
+            <para>Each property, except for the <prop>Special_Case_Condition</prop> and <prop>Name_Alias</prop>
+                properties, is represented by an attribute. In an XML data file, the absence of an attribute (possibly
+                only on some <codephrase>code-point</codephrase>s) means that the document does not express the value
+                of the corresponding property. Conversely, the presence of an attribute is an expression of the
+                corresponding property value; the implied null value is represented by the empty string.
+            </para>
+            <para>The <prop>Name_Alias</prop> property is represented by zero or more <elem>name-alias</elem> child
+                elements. Unlike the situation for properties represented by attributes, it is not possible to determine
+                whether all the aliases have been represented in a data file by inspecting that data file.
+            </para>
+            <para>The name of an attribute is the abbreviated name of the property as given in the file
+                PropertyAliases.txt in the corresponding version of the UCD. For the Unihan
+                properties, the name is that given in the various versions of the Unihan database.
+            </para>
+            <para>For catalog and enumerated properties, the values are those listed in the file
+                PropertyValueAliases.txt in the corresponding version of the UCD; if there is an abbreviated
+                name, it is used, otherwise the long name is used.
+            </para>
+            <para>Note that the set of possible values for a property captured in this schema may change from one
+                version to the next.
+            </para>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Age property</title>
+                <para>The <attr>age</attr> attribute captures the version of Unicode in which a code point was
+                    assigned to an abstract character, or made a surrogate or non-character.
+                </para>
+                <xi:include href="./fragments/age.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Name properties</title>
+                <para>There are two name properties: the name given by the current version of the standard
+                    (<attr>na</attr>), and possibly the name this character had in version 1.0 of the standard
+                    (<attr>na1</attr>).
+                </para>
+                <xi:include href="./fragments/na.xml"/>
+                <xi:include href="./fragments/na1.xml"/>
+                <para>The majority of the characters in Unicode have a name which is of the form CJK UNIFIED
+                    IDEOGRAPH-<codephrase>&lt;code point&gt;</codephrase>. It also happens that character names cannot
+                    contain the character U+0023 &#x0023; NUMBER SIGN, so we adopted the following convention: if a
+                    code point has the attribute <attr>na</attr> (either directly or by inheritance from an enclosing
+                    group), then occurrences of the character # in the name are to be interpreted as the value of the
+                    code point. For example:
+                </para>
+                <codeblock>
+    &lt;char cp="3400" na="CJK UNIFIED IDEOGRAPH-3400"/></codeblock>
+                <para>and</para>
+                <codeblock>
+    &lt;char cp="3400" na="CJK UNIFIED IDEOGRAPH-#"/></codeblock>
+                <para>are equivalent. The # can be in any position in the value of the <attr>na</attr>
+                    attribute. The convention also applies just as well to a set of multiple code points:
+                </para>
+                <codeblock>
+    &lt;char cp="3400" na="CJK UNIFIED IDEOGRAPH-3400"/>
+    &lt;char cp="3401" na="CJK UNIFIED IDEOGRAPH-3401"/></codeblock>
+                <para>is equivalent to</para>
+                <codeblock>
+    &lt;char cp="3400" na="CJK UNIFIED IDEOGRAPH-#"/>
+    &lt;char cp="3401" na="CJK UNIFIED IDEOGRAPH-#"/></codeblock>
+                <para>which in turn is equivalent to:</para>
+                <codeblock>
+    &lt;char first-cp="3400" last-cp="3401" na="CJK UNIFIED IDEOGRAPH-#"/></codeblock>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Name Alias properties</title>
+                <para>The <prop>Name_Alias</prop> property is represented by zero or more <elem>name-alias</elem>
+                    child elements:
+                </para>
+                <xi:include href="./fragments/Name_Alias.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Block property</title>
+                <para>The <prop>Block</prop> property is represented by the <attr>blk</attr> attribute:
+                </para>
+                <xi:include href="./fragments/blk.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>General Category</title>
+                <para>The general category is represented by the <attr>gc</attr> attribute.
+                </para>
+                <xi:include href="./fragments/gc.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Combining properties</title>
+                <para>The combining class is represented by the <attr>ccc</attr> attribute, which holds the decimal
+                    representation of the combining class.
+                </para>
+                <para>Because the set of values that this property has taken across the various versions of the UCD
+                    is rather large, our schema does not restrict the possible values to those actually used.
+                </para>
+                <!--Manual--><xi:include href="./fragments/ccc.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Bidirectionality properties</title>
+                <para>The bidirectional class is represented by the <attr>bc</attr> attribute.
+                </para>
+                <xi:include href="./fragments/bc.xml"/>
+                <para>The mirrored property is represented by the <attr>Bidi_M</attr> attribute, which takes a
+                    boolean value.
+                </para>
+                <xi:include href="./fragments/Bidi_M.xml"/>
+                <para>The <attr>bmg</attr> attribute is the code point of a character whose glyph is typically
+                    a mirrored image of the glyph for the current character.
+                </para>
+                <xi:include href="./fragments/bmg.xml"/>
+                <para>Note that we do not express the &#x201c;Best Fit&#x201d; element recorded in BidiMirroring.txt.
+                    For one thing, it is not meant to be machine readable. More importantly, the idea underlying the
+                    mirrored glyph is delicate to use, since it makes assumptions about the design of the fonts, and
+                    the best fit goes even farther.
+                </para>
+                <para>The <prop>Bidi_Control</prop> property is represented by the <attr>Bidi_C</attr> attribute.
+                </para>
+                <xi:include href="./fragments/Bidi_C.xml"/>
+                <para>The bidi paired bracket type and bidi paired bracket properties are represented by the
+                    <attr>bpt</attr> and <attr>bpb</attr> attributes respectively.
+                </para>
+                <xi:include href="./fragments/bpt.xml"/>
+                <xi:include href="./fragments/bpb.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Decomposition properties</title>
+                <para>The decomposition type and decomposition mapping properties are represented by the <attr>dt</attr>
+                    and <attr>dm</attr> attributes.
+                </para>
+                <para>Most characters have a decomposition mapping to themselves. This is very similar to the
+                    situation we encountered with names, and we adopted a similar convention: if the value of a
+                    decomposition mapping is the character itself, we use the attribute value # (U+0023 &#x0023;
+                    NUMBER SIGN) as a shorthand notation; this enables those attributes to be captured in groups.
+                </para>
+                <xi:include href="./fragments/decomposition.xml"/>
+                <para>The properties <prop>Composition_Exclusion</prop> and <prop>Full_Composition_Exclusion</prop> are
+                    represented by the attributes <attr>CE</attr> and <attr>Comp_Ex</attr>:
+                </para>
+                <xi:include href="./fragments/composition.xml"/>
+                <para>The properties <prop>NFC_Quick_Check</prop>, <prop>NFD_Quick_Check</prop>,
+                    <prop>NFKC_Quick_Check</prop>, <prop>NFKD_Quick_Check</prop>, <prop>Expands_On_NFC</prop>,
+                    <prop>Expands_On_NFD</prop>, <prop>Expands_On_NFKC</prop>, <prop>Expands_On_NFKD</prop>,
+                    <prop>FC_NFKC_Closure</prop> have corresponding attributes.
+                </para>
+                <xi:include href="./fragments/quickcheck.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Numeric Properties</title>
+                <para>The numeric type is represented by the <attr>nt</attr> attribute.
+                </para>
+                <para>The numeric value is represented by the <attr>nv</attr> attribute, represented as a whole
+                    number or a fraction.
+                </para>
+                <xi:include href="./fragments/numeric.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Joining properties</title>
+                <para>The joining class of a character is represented by the <attr>jt</attr> attribute.
+                </para>
+                <para>The <attr>jg</attr> attribute is the joining group of the character.
+                </para>
+                <xi:include href="./fragments/joining.xml"/>
+                <para>The <prop>Join_Control</prop> property is represented by the <attr>Join_C</attr> attribute.
+                </para>
+                <xi:include href="./fragments/Join_C.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Linebreak properties</title>
+                <para>The <prop>Line_Break</prop> property is represented by the <attr>lb</attr> attribute.
+                </para>
+                <xi:include href="./fragments/lb.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>East Asian Width property</title>
+                <para>The East Asian width property is represented by the <attr>ea</attr> attribute.
+                </para>
+                <xi:include href="./fragments/ea.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Case properties</title>
+                <para>The <prop>Uppercase</prop>, <prop>Lowercase</prop>, <prop>Other_Uppercase</prop> and
+                    <prop>Other_Lowercase</prop> properties are represented by corresponding attributes.
+                </para>
+                <xi:include href="./fragments/casing.xml"/>
+                <para>Most characters have case mapping and case folding properties that simply map or fold to
+                    themselves. This is very similar to the situation we encountered with names, and we adopted a
+                    similar convention: if the value of a case mapping or case folding property is the character
+                    itself, we use the attribute value # (U+0023 &#x0023; NUMBER SIGN) as a shorthand notation; this
+                    enables those attributes to be captured in groups.
+                </para>
+                <para>The simple case mappings are recorded in the <attr>suc</attr>, <attr>slc</attr>, <attr>stc</attr>
+                    attributes.
+                </para>
+                <xi:include href="./fragments/simple_case_mapping.xml"/>
+                <para>The non-simple case mappings are recorded in the <attr>uc</attr>, <attr>lc</attr> and <attr>tc</attr>
+                    attributes.
+                </para>
+                <xi:include href="./fragments/case_mapping.xml"/>
+                <para>The <prop>Simple_Case_Folding</prop> and <prop>Case_Folding</prop> properties are recorded in the
+                    <attr>scf</attr> and <attr>cf</attr> attributes respectively.
+                </para>
+                <xi:include href="./fragments/case_folding.xml"/>
+                <para>The <prop>Case_Ignorable</prop>, <prop>Cased</prop>, <prop>Changes_When_Casefolded</prop>,
+                    <prop>Changes_When_Casemapped</prop>, <prop>Changes_When_Lowercased</prop>,
+                    <prop>Changes_When_NFKC_Casefolded</prop>, <prop>Changes_When_Titlecased</prop>,
+                    <prop>Changes_When_Uppercased</prop>, <prop>NFKC_Casefold</prop>, and
+                    <prop>NFKC_Simple_Casefold</prop> properties are recorded in these attributes:
+                </para>
+                <xi:include href="./fragments/case_other.xml"/>
+                <para>Note that the UCD records more information about case folding than is expressed in the
+                    properties, specifically the entries in CaseFolding.txt with status T.
+                </para>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Script properties</title>
+                <para>The script and script extension properties are represented by the <attr>sc</attr> and
+                    <attr>scx</attr> attributes respectively.
+                </para>
+                <xi:include href="./fragments/script.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>ISO Comment properties</title>
+                <para>The ISO 10646 comment field is represented by the <attr>isc</attr> attribute.
+                </para>
+                <xi:include href="./fragments/isc.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Hangul properties</title>
+                <para>The property <prop>Hangul_Syllable_Type</prop> is represented by the <attr>hst</attr> attribute.
+                </para>
+                <xi:include href="./fragments/hst.xml"/>
+                <para>The property <prop>Jamo_Short_Name</prop> is represented by the <attr>JSN</attr> attribute:
+                </para>
+                <xi:include href="./fragments/JSN.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Indic properties</title>
+                <para>The property <prop>Indic_Syllabic_Category</prop> is represented by the <attr>InSC</attr>
+                    attribute.
+                </para>
+                <xi:include href="./fragments/InSC.xml"/>
+                <para>The property <prop>Indic_Positional_Category</prop> is represented by the <attr>InPC</attr>
+                    attribute:
+                </para>
+                <xi:include href="./fragments/InPC.xml"/>
+                <para>The property <prop>Indic_Conjunct_Break</prop> is represented by the <attr>InCB</attr> attribute:
+                </para>
+                <xi:include href="./fragments/InCB.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Identifier and Pattern and programming language properties</title>
+
+                <para>The properties <prop>ID_Start</prop>, <prop>Other_ID_Start</prop>, <prop>XID_Start</prop>,
+                    <prop>ID_Continue</prop>, <prop>Other_ID_Continue</prop>, <prop>XID_Continue</prop>,
+                    <prop>ID_Compat_Math_Start</prop>, and <prop>ID_Compat_Math_Continue</prop> are represented by
+                    corresponding attributes:
+                </para>
+                <xi:include href="./fragments/identifier.xml"/>
+                <para>The properties <prop>Pattern_Syntax</prop> and <prop>Pattern_White_Space</prop> are represented
+                    by corresponding attributes:
+                </para>
+                <xi:include href="./fragments/pattern.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Properties related to function and graphic characteristics</title>
+                <para>The properties <prop>Dash</prop>, <prop>Hyphen</prop>, <prop>Quotation_Mark</prop>,
+                    <prop>Terminal_Punctuation</prop>, <prop>Sentence_Terminal</prop>, <prop>Diacritic</prop>,
+                    <prop>Extender</prop>, <prop>Soft_Dotted</prop>, <prop>Alphabetic</prop>,
+                    <prop>Other_Alphabetic</prop>, <prop>Math</prop>, <prop>Other_Math</prop>, <prop>Hex_Digit</prop>,
+                    <prop>ASCII_Hex_Digit</prop>, <prop>Default_Ignorable_Code_Point</prop>,
+                    <prop>Other_Default_Ignorable_Code_Point</prop>, <prop>Logical_Order_Exception</prop>,
+                    <prop>Prepended_Concatenation_Mark</prop>, <prop>Modifier_Combining_Mark</prop>,
+                    <prop>White_Space</prop>, <prop>Vertical_Orientation</prop>, and <prop>Regional_Indicator</prop>
+                    describe the function or graphic characteristic of a character, and each have a corresponding
+                    attribute.
+                </para>
+                <xi:include href="./fragments/function_graphic.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Properties related to boundaries</title>
+                <para>The properties <prop>Grapheme_Base</prop>, <prop>Grapheme_Extend</prop>,
+                    <prop>Other_Grapheme_Extend</prop>, <prop>Grapheme_Link</prop>,
+                    <prop>Grapheme_Cluster_Break</prop>, <prop>Word_Break</prop>, and <prop>Sentence_Break</prop> each
+                    have a corresponding attribute:
+                </para>
+                <xi:include href="./fragments/boundaries.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Properties related to ideographs</title>
+                <para>The properties <prop>Ideographic</prop>, <prop>Unified_Ideograph</prop>,
+                    <prop>Equivalent_Unified_Ideograph</prop>, <prop>IDS_Binary_Operator</prop>,
+                    <prop>IDS_Trinary_Operator</prop>, <prop>IDS_Unary_Operator</prop>, and <prop>Radical</prop> have
+                    corresponding attributes:
+                </para>
+                <xi:include href="./fragments/ideographs.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Miscellaneous properties</title>
+                <para>The properties <prop>Deprecated</prop>, <prop>Variation_Selector</prop>, and
+                    <prop>Noncharacter_Code_Point</prop> have corresponding attributes:
+                </para>
+                <xi:include href="./fragments/miscellaneous.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Unihan properties</title>
+                <para>The Unihan properties (from the Unihan database) are represented as attributes.
+                </para>
+                <xi:include href="./fragments/Unihan.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Tangut data</title>
+                <para>The Tangut data are represented as attributes. The attribute <attr>kRSTUnicode</attr>
+                    represents the radical stroke index. The attribute <attr>kTGT_MergedSrc</attr> indicates the
+                    source reference for the character.
+                </para>
+                <xi:include href="./fragments/Tangut.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Nushu data</title>
+                <para>The Nushu data are represented as attributes. The attribute <attr>kSrc_NushuDuben</attr>
+                    indicates the page number and order of the item from the NushuDuben reference source. Nushu common
+                    reading is represented as <attr>kReading</attr>.</para>
+                <xi:include href="./fragments/Nushu.xml"/>
+            </section>
+
+            <!--____________________________________________________________________-->
+            <section>
+                <title>Emoji properties</title>
+                <para>The properties <prop>Emoji</prop>, <prop>EPres</prop>, <prop>EMod</prop>, <prop>EBase</prop>,
+                    <prop>EComp</prop>, and <prop>ExtPict</prop> have corresponding attributes:
+                </para>
+                <xi:include href="./fragments/Emoji.xml"/>
+            </section>
+        </section>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>Blocks</title>
+        <para>The <elem>blocks</elem> child of the <elem>ucd</elem> describes the blocks. It has one child
+            <elem>block</elem> element per block, with attributes to describe the extent and name of the block.
+        </para>
+        <xi:include href="./fragments/block.xml"/>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>Named Sequences</title>
+        <para>The <elem>named-sequences</elem> child of the <elem>ucd</elem> describes the named sequences. It has one
+            child <elem>named-sequence</elem> element per named sequence, with attributes to describe the name and
+            sequence.
+        </para>
+        <para>Similarly, the <elem>provisional-named-sequences</elem> child of the <elem>ucd</elem> describes the
+            provisional named sequences.
+        </para>
+        <xi:include href="./fragments/named-sequences.xml"/>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>Normalization Corrections</title>
+        <para>The <elem>normalization-corrections</elem> child of the <elem>ucd</elem> describes the normalization
+            corrections. It has one child <elem>normalization-correction</elem> element per correction, with
+            attributes to describe the code point affected, its old normalization, its new normalization and the
+            version of Unicode in which the correction was made.
+        </para>
+        <xi:include href="./fragments/normalization-corrections.xml"/>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>Standardized Variants</title>
+        <para>The <elem>standardized-variants</elem> child of the <elem>ucd</elem> describes the standardized
+            variants. It has one child element <elem>standardized-variant</elem> per variant. The attributes on that
+            last element capture the variation sequence, the description of the desired appearance, and the shaping
+            environment under which the appearance is different.
+        </para>
+        <xi:include href="./fragments/standardized-variants.xml"/>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>CJK Radicals</title>
+        <para>The <elem>cjk-radicals</elem> child of the <elem>ucd</elem> describes the CJK radicals. It has one
+            child element <elem>cjk-radical</elem> per radical. The attributes on that last element capture the
+            radical number, the corresponding CJK radical character, and the corresponding CJK unified ideograph.
+        </para>
+        <xi:include href="./fragments/cjk-radicals.xml"/>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>Emoji sources</title>
+        <para>The <elem>emoji-sources</elem> child of the <elem>ucd</elem> describes the emoji sources.
+        </para>
+        <xi:include href="./fragments/emoji-sources.xml"/>
+
+        <xi:include href="./fragments/jis-code-point.xml"/>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>Do Not Emit</title>
+        <para><phrase revisionflag='added'>The <elem>do-not-emit</elem> child of the <elem>ucd</elem> describes the
+            character sequences that should not be emitted or generated in newly authored texts.
+            </phrase>
+        </para>
+        <xi:include href="./fragments/do-not-emit.xml"/>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>The full schema</title>
+        <para>Our schema is just the accumulation of the pieces we have described so far:
+        </para>
+        <ucdxml:schema title='UCD RelaxNG schema' file='ucd.rnc' method='text'>
+      <ucdxml:include linkend='schema.namespace'/>
+      <ucdxml:include linkend='schema.datatypes' title='datatypes'/>
+      <ucdxml:include linkend='schema.start'/>
+      <ucdxml:include linkend='schema.boolean'/>
+      <ucdxml:include linkend='schema.description'/>
+      <ucdxml:include linkend='schema.repertoire' title='repertoire'/>
+      <ucdxml:include linkend='schema.properties' title='attributes'/>
+      <ucdxml:include linkend='schema.tangut'/>
+      <ucdxml:include linkend='schema.nushu'/>
+      <ucdxml:include linkend='schema.block'/>
+      <ucdxml:include linkend='schema.named-sequences'/>
+      <ucdxml:include linkend='schema.normalization-corrections'/>
+      <ucdxml:include linkend='schema.standardized-variants'/>
+      <ucdxml:include linkend='schema.cjk-radicals'/>
+      <ucdxml:include linkend='schema.emoji-sources'/>
+      <ucdxml:include linkend='schema.emoji-data'/>
+      <ucdxml:include linkend='schema.do-not-emit'/>
+</ucdxml:schema>
+        <para>An expanded version is linked from the top of this document.</para>
+    </section>
+
+    <!--========================================================================-->
+    <section>
+        <title>Examples</title>
+        <para>Here is a fragment of the UCD for a few representative
+            characters (only some of the properties are represented):
+        </para>
+
+        <codeblock>
+            <![CDATA[
+  <ucd xmlns="http://www.unicode.org/ns/2003/ucd/1.0">
+    <repertoire>
+      <char cp="001F" age="1.1" na="&lt;control&gt;" na1="UNIT SEPARATOR"
+            gc="Cc" bc="S" lb="CM"/>
+
+      <char cp="0020" age="1.1" na="SPACE" gc="Zs" bc="WS" ea="Na" lb="SP"/>
+
+      <char cp="0026" age="1.1" na="AMPERSAND" gc="Po" bc="ON" ea="Na"/>
+
+      <char cp="0028" age="1.1" na="LEFT PARENTHESIS" na1="OPENING PARENTHESIS"
+            gc="Ps" bc="ON" Bidi_M="y" bmg="0029" ea="Na" lb="OP"/>
+
+      <char cp="0041" age="1.1" na="LATIN CAPITAL LETTER A"
+            gc="Lu" slc="0061" ea="Na" sc="Latn"/>
+
+      <char cp="AC00" age="2.0" na="HANGUL SYLLABLE GA" gc="Lo"
+            dt="can" dm="1100 1161" ea="W" lb="ID" sc="Hang"/>
+
+      <char cp="20094" age="3.1" na="CJK UNIFIED IDEOGRAPH-20094"
+            gc="Lo" ea="W" lb="ID" sc="Hani" kIRG_GSource="KX"
+            kIRGHanyuDaZidian="10036.060" kIRG_TSource="5-214E"
+            kRSUnicode="4.3" kIRGKangXi="0082.090"/>
+
+      <group age="3.2" gc="Lo" sc="Buhd">
+        <char cp="1740" na="BUHID LETTER A"/>
+        <char cp="1741" na="BUHID LETTER I"/>
+        <char cp="1752" na="BUHID VOWEL SIGN I" gc="Mn"/>
+        <char cp="1820" age="3.0" na="MONGOLIAN LETTER A" sc="Mong"/>
+      </group>
+    </repertoire>
+  </ucd>
+]]>
+</codeblock>
+    </section>
+
+    <!--========================================================================-->
+    <acknowledgments>
+        <title>Acknowledgments</title>
+        <para>Thanks to Markus Scherer and Mark Davis for their help developing this XML representation. Thanks to
+            the reviewers: Julie Allen, Ernest van den Boogaard, Daniel B&#x00FC;nzli, John Cowan, Asmus Freytag,
+            Felix Sasaki, Andrew West. Special thanks to Eric Muller and Laurențiu Iancu.
+        </para>
+    </acknowledgments>
+</article>
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/index2html.xsl b/unicodetools/src/main/resources/org/unicode/uax42/index2html.xsl
new file mode 100644
index 000000000..f0a95fa95
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/index2html.xsl
@@ -0,0 +1,611 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<xsl:stylesheet
+  xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+  xmlns:unicode="http://unicode.org/ns/2001"
+  xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml"
+  xmlns="http://www.w3.org/1999/xhtml"
+  exclude-result-prefixes="unicode"
+  version="2.0">
+
+  <xsl:output
+          method="xml"
+          omit-xml-declaration="yes"
+          indent="yes"
+          doctype-public="-//W3C//DTD XHTML 1.0 Transitional//EN"
+          doctype-system="http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"
+          encoding="UTF-8"/>
+
+<!-- Start of the article, headings, and version table -->
+
+  <xsl:template match="article"> <!-- Root template: renders the article as one XHTML page (head, header bar, headings, then the body via generate-body). -->
+<!--    For debugging-->
+<!--    <xsl:comment>-->
+<!--      XSLT Version = <xsl:copy-of select="system-property('xsl:version')"/>-->
+<!--      XSLT Vendor = <xsl:copy-of select="system-property('xsl:vendor')"/>-->
+<!--      XSLT Vendor URL = <xsl:copy-of select="system-property('xsl:vendor-url')"/>-->
+<!--    </xsl:comment>-->
+    <html>
+      <head>
+        <meta http-equiv="content-type" content="text/html; charset=UTF-8" />
+        <link rel="stylesheet" type="text/css" href="https://www.unicode.org/reports/reports-v2.css" />
+        <title> <!-- Page title: class abbreviation from unicode:tr/@class, then " #", the report number, ": " and the article title. -->
+          <xsl:choose>
+            <xsl:when test="articleinfo/unicode:tr/@class='uax'">
+              <xsl:text>UAX</xsl:text>
+            </xsl:when>
+            <xsl:when test="articleinfo/unicode:tr/@class='uts'">
+              <xsl:text>UTS</xsl:text>
+            </xsl:when>
+            <xsl:when test="articleinfo/unicode:tr/@class='utr'">
+              <xsl:text>UTR</xsl:text>
+            </xsl:when>
+          </xsl:choose>
+          <xsl:text> #</xsl:text>
+          <xsl:value-of select="articleinfo/unicode:tr/@number"/>
+          <xsl:text>: </xsl:text>
+          <xsl:value-of select="title"/>
+        </title>
+      </head>
+      <body style="background-color:#ffffff">
+        <table class="header" cellpadding="0" cellspacing="0" width="100%">
+          <tbody>
+            <tr>
+              <td class="icon">
+                <a href="https://www.unicode.org/">
+                  <img style="vertical-align:middle;border:0" alt="[Unicode]"
+                       src="https://www.unicode.org/webscripts/logo60s2.gif" height="33" width="34" />
+                </a>&#x00A0;<a class="bar" href="https://www.unicode.org/reports/">Technical Reports</a>
+              </td>
+            </tr>
+            <tr>
+              <td class="gray">&#x00A0;</td>
+            </tr>
+          </tbody>
+        </table>
+        <div class="body">
+          <h2 style="text-align:center"> <!-- Heading: optional draft-stage label, the long report-class name, then " #" and the report number. -->
+            <xsl:call-template name="display-stage"/>
+            <xsl:text> </xsl:text>
+            <xsl:choose>
+              <xsl:when test="articleinfo/unicode:tr/@class='uax'">
+                <xsl:text>Unicode® Standard Annex</xsl:text>
+              </xsl:when>
+              <xsl:when test="articleinfo/unicode:tr/@class='uts'">
+                <xsl:text>Unicode® Technical Standard</xsl:text>
+              </xsl:when>
+              <xsl:when test="articleinfo/unicode:tr/@class='utr'">
+                <xsl:text>Unicode® Technical Report</xsl:text>
+              </xsl:when>
+            </xsl:choose>
+            <xsl:text> #</xsl:text>
+            <xsl:value-of select="articleinfo/unicode:tr/@number"/>
+          </h2>
+          <h1 style="text-align:center"><xsl:value-of select="title"/></h1>
+          <!-- Here's where we add all sections of the document -->
+          <xsl:call-template name="generate-body"/>
+        </div>
+      </body>
+    </html>
+  </xsl:template>
+
+  <xsl:template name="generate-body"> <!-- Emits the report body in this fixed order; the context node is the article element. -->
+    <xsl:call-template name="version-info"/>
+    <xsl:apply-templates select="abstract"/>
+    <xsl:call-template name="status"/>
+    <xsl:call-template name="toc"/>
+    <hr/>
+    <xsl:apply-templates select="section|acknowledgments"/> <!-- Top-level sections and acknowledgments, in document order. -->
+    <h2><a name="Modifications">Modifications</a></h2> <!-- Anchor targeted by the "Revision" link in the version table. -->
+    <p>This section indicates the changes introduced by each revision.</p>
+    <xsl:apply-templates select="articleinfo/revhistory"/>
+    <hr/>
+    <xsl:call-template name="copyright"/>
+  </xsl:template>
+
+  <xsl:template name="display-stage"> <!-- Emits a highlighted stage label for drafts; any other unicode:tr/@stage value produces no output. -->
+    <xsl:choose>
+      <xsl:when test="articleinfo/unicode:tr/@stage='working-draft'">
+        <span style="background-color: #ffff00; border-style:dotted; border-width:1px"><xsl:text>Working draft</xsl:text></span>
+      </xsl:when>
+      <xsl:when test="articleinfo/unicode:tr/@stage='proposed-update'">
+        <span style="background-color: #ffff00; border-style:dotted; border-width:1px"><xsl:text>Proposed Update</xsl:text></span>
+      </xsl:when>
+    </xsl:choose>
+  </xsl:template>
+
+  <xsl:template name="version-info"> <!-- Renders the version table: version, editor(s), date, version URLs, optional schema URL, revision. -->
+
+    <xsl:param name="thisnumber"> <!-- Report number, from unicode:tr/@number. -->
+      <xsl:value-of select="articleinfo/unicode:tr/@number"/>
+    </xsl:param>
+
+    <xsl:param name="thisrev"> <!-- Revision number of the first revision entry in revhistory. -->
+      <xsl:value-of select="articleinfo/revhistory/revision[1]/@revnumber"/>
+    </xsl:param>
+
+    <xsl:param name="thisurl"> <!-- https://www.unicode.org/reports/tr{number}/tr{number}-{thisrev}.html -->
+      <xsl:text>https://www.unicode.org/reports/tr</xsl:text>
+      <xsl:value-of select="$thisnumber"/>
+      <xsl:text>/tr</xsl:text>
+      <xsl:value-of select="$thisnumber"/>
+      <xsl:text>-</xsl:text>
+      <xsl:value-of select="$thisrev"/>
+      <xsl:text>.html</xsl:text>
+    </xsl:param>
+
+    <xsl:param name="prevrev"> <!-- Previous revision number, from unicode:tr/@prevrev; empty when the attribute is absent. -->
+      <xsl:value-of select="articleinfo/unicode:tr/@prevrev"/>
+    </xsl:param>
+
+    <xsl:param name="prevurl"> <!-- Same shape as thisurl, but built with prevrev. -->
+      <xsl:text>https://www.unicode.org/reports/tr</xsl:text>
+      <xsl:value-of select="$thisnumber"/>
+      <xsl:text>/tr</xsl:text>
+      <xsl:value-of select="$thisnumber"/>
+      <xsl:text>-</xsl:text>
+      <xsl:value-of select="$prevrev"/>
+      <xsl:text>.html</xsl:text>
+    </xsl:param>
+
+    <xsl:param name="latesturl"> <!-- https://www.unicode.org/reports/tr{number}/ -->
+      <xsl:text>https://www.unicode.org/reports/tr</xsl:text>
+      <xsl:value-of select="$thisnumber"/>
+      <xsl:text>/</xsl:text>
+    </xsl:param>
+
+    <xsl:param name="thisschema"> <!-- Same shape as thisurl, but with the .rnc extension. -->
+      <xsl:text>https://www.unicode.org/reports/tr</xsl:text>
+      <xsl:value-of select="$thisnumber"/>
+      <xsl:text>/tr</xsl:text>
+      <xsl:value-of select="$thisnumber"/>
+      <xsl:text>-</xsl:text>
+      <xsl:value-of select="$thisrev"/>
+      <xsl:text>.rnc</xsl:text>
+    </xsl:param>
+
+    <table class="simple" width="90%">
+      <tbody>
+        <tr>
+          <td valign="top" width="20%">Version</td>
+          <td valign="top"> <!-- The version is prefixed with "Unicode " only for reports of class uax. -->
+            <xsl:if test="//article/articleinfo/unicode:tr/@class='uax'">Unicode </xsl:if>
+            <span>
+              <xsl:call-template name="apply-draft-highlighting"/>
+              <xsl:value-of select="articleinfo/unicode:tr/@version"/>
+            </span>
+          </td>
+        </tr>
+        <tr>
+          <td valign="top"> <!-- Label is "Editor" for exactly one author, "Editors" otherwise. -->
+            <xsl:choose>
+              <xsl:when test="count(articleinfo/authors/author)=1">
+                Editor
+              </xsl:when>
+              <xsl:otherwise>
+                Editors
+              </xsl:otherwise>
+            </xsl:choose>
+          </td>
+          <td valign="top">
+            <xsl:apply-templates select="articleinfo/authors"/>
+          </td>
+        </tr>
+        <tr>
+          <td valign="top">Date</td>
+          <td valign="top">
+            <span>
+              <xsl:call-template name="apply-draft-highlighting"/>
+              <xsl:value-of select="articleinfo/revhistory/revision[1]/@date"/>
+            </span>
+          </td>
+        </tr>
+        <tr>
+          <td valign="top">This Version</td>
+          <td valign="top">
+            <span>
+              <xsl:call-template name="apply-draft-highlighting"/>
+              <a href="{$thisurl}"><xsl:value-of select="$thisurl"/></a>
+            </span>
+          </td>
+        </tr>
+        <tr>
+          <td valign="top">Previous Version</td>
+          <td valign="top"> <!-- Shows "n/a" when prevrev is empty, otherwise a link to prevurl. -->
+            <xsl:choose>
+              <xsl:when test="$prevrev = ''">
+                <xsl:text>n/a</xsl:text>
+              </xsl:when>
+              <xsl:otherwise>
+                <span>
+                  <xsl:call-template name="apply-draft-highlighting"/>
+                  <a href="{$prevurl}"><xsl:value-of select="$prevurl"/></a>
+                </span>
+              </xsl:otherwise>
+            </xsl:choose>
+          </td>
+        </tr>
+        <tr>
+          <td valign="top">Latest Version</td>
+          <td valign="top">
+            <a href="{$latesturl}"><xsl:value-of select="$latesturl"/></a>
+          </td>
+        </tr>
+        <tr>
+          <td valign="top">Latest Proposed Update</td>
+          <td valign="top">
+            <a href="{$latesturl}proposed.html"><xsl:value-of select="$latesturl"/>proposed.html</a>
+          </td>
+        </tr>
+        <xsl:if test="articleinfo/unicode:tr/@schema"> <!-- The Schema row is emitted only when unicode:tr carries a schema attribute. -->
+          <tr>
+            <td valign="top">Schema</td>
+            <td valign="top">
+              <span>
+                <xsl:call-template name="apply-draft-highlighting"/>
+                <a href="{$thisschema}"><xsl:value-of select="$thisschema"/></a>
+              </span>
+            </td>
+          </tr>
+        </xsl:if>
+        <tr>
+          <td valign="top">Revision</td>
+          <td valign="top">
+            <a href="#Modifications">
+              <span>
+                <xsl:call-template name="apply-draft-highlighting"/>
+                <xsl:value-of select="$thisrev"/>
+              </span>
+            </a>
+          </td>
+        </tr>
+      </tbody>
+    </table>
+  </xsl:template>
+
+  <xsl:template match="authors"> <!-- Container only: processes its children with their own templates. -->
+    <xsl:apply-templates/>
+  </xsl:template>
+
+  <xsl:template match="author"> <!-- Emits "firstname surname", then any email child via its template, then a line break. -->
+    <xsl:value-of select="firstname"/>
+    <xsl:text> </xsl:text>
+    <xsl:value-of select="surname"/>
+    <xsl:apply-templates select="email"/><br/>
+  </xsl:template>
+
+  <xsl:template match="email"> <!-- Emits the address in parentheses as a mailto: link whose text is the address itself. -->
+    <xsl:text> (</xsl:text>
+    <a><xsl:attribute name="href">mailto:<xsl:value-of select="."/></xsl:attribute><xsl:value-of select="."/></a>
+    <xsl:text>)</xsl:text>
+  </xsl:template>
+
+  <!-- Summary/Abstract -->
+
+  <xsl:template match="abstract"> <!-- Emits a "Summary" heading, then the abstract's children via their templates. -->
+    <h4 style="margin-top: 1em;">Summary</h4>
+    <xsl:apply-templates/>
+  </xsl:template>
+
+  <xsl:template match="abstract/para"> <!-- Paragraphs directly inside the abstract are rendered in italics. -->
+    <p><i><xsl:apply-templates/></i></p>
+  </xsl:template>
+
+  <!-- Status -->
+
+  <xsl:template name="status">
+    <h4><i>Status</i></h4>
+    <xsl:choose>
+      <xsl:when test="articleinfo/unicode:tr/@stage='approved'">
+        <p><i>This document has been reviewed by Unicode members and other interested parties, and has been
+          approved for publication by the Unicode Consortium. This is a stable document and may be used as reference
+          material or cited as a normative reference by other specifications.</i></p>
+      </xsl:when>
+      <xsl:otherwise>
+        <p>
+          <xsl:call-template name="apply-draft-highlighting"/>
+          <i>This is a <b><span style="color:#ff0000">draft</span></b> document which may be updated, replaced, or
+            superseded by other documents at any time. Publication does not imply endorsement by the Unicode
+            Consortium.  This is not a stable document; it is inappropriate to cite this document as other than a
+            work in progress.</i></p>
+      </xsl:otherwise>
+    </xsl:choose>
+    <xsl:choose>
+      <xsl:when test="articleinfo/unicode:tr/@class='uax'">
+        <blockquote>
+          <p><i><b>A Unicode Standard Annex (UAX)</b> forms an integral part of the Unicode Standard, but is
+            published online as a separate document. The Unicode Standard may require conformance to normative
+            content in a Unicode Standard Annex, if so specified in the Conformance chapter of that version of the
+            Unicode Standard. The version number of a UAX document corresponds to the version of the Unicode Standard
+            of which it forms a part.</i></p>
+        </blockquote>
+        <p><i>Please submit corrigenda and other comments with the online reporting form [<a
+                href="https://www.unicode.org/reporting.html">Feedback</a>]. Related information that is useful in
+          understanding this annex is found in Unicode Standard Annex #41, &#x201C;<a
+                  href="https://www.unicode.org/reports/tr41/tr41-32.html">Common References for Unicode Standard
+            Annexes.</a>&#x201D; For the latest version of the Unicode Standard, see [<a
+                  href="https://www.unicode.org/versions/latest/">Unicode</a>]. For a list of current Unicode
+          Technical Reports, see [<a href="https://www.unicode.org/reports/">Reports</a>]. For more information about
+          versions of the Unicode Standard, see [<a href="https://www.unicode.org/versions/">Versions</a>]. For any
+          errata which may apply to this annex, see [<a href="https://www.unicode.org/errata/">Errata</a>].</i></p>
+      </xsl:when>
+      <xsl:when test="articleinfo/unicode:tr/@class='uts'">
+        <blockquote>
+          <p><i><b>A Unicode Technical Standard (UTS)</b> is an independent specification. Conformance to the Unicode
+            Standard does not imply conformance to any UTS.</i></p>
+        </blockquote>
+        <p><i>Please submit corrigenda and other comments with the online reporting form [<a href="#biblio_feedback">
+          Feedback</a>]. Related information that is useful in understanding this document is found in <a
+                href="#references">References</a>.  For the latest version of the Unicode Standard see [<a
+                href="#biblio_unicode">Unicode</a>]. For a list of current Unicode Technical Reports see [<a
+                href="#biblio_reports">Reports</a>]. For more information about versions of the Unicode Standard, see
+          [<a href="#biblio_versions">Versions</a>].</i></p>
+      </xsl:when>
+      <xsl:when test="articleinfo/unicode:tr/@class='utr'">
+        <blockquote>
+          <p><i><b>A Unicode Technical Report (UTR)</b> contains informative material. Conformance to the Unicode
+            Standard does not imply conformance to any UTR. Other specifications, however, are free to make normative
+            references to a UTR.</i></p>
+        </blockquote>
+        <p><i>Please submit corrigenda and other comments with the online reporting form [<a href="#biblio_feedback">
+          Feedback</a>]. Related information that is useful in understanding this document is found in <a
+                href="#references">References</a>.  For the latest version of the Unicode Standard see [<a
+                href="#biblio_unicode">Unicode</a>]. For a list of current Unicode Technical Reports see [<a
+                href="#biblio_reports">Reports</a>]. For more information about versions of the Unicode Standard, see
+          [<a href="#biblio_versions">Versions</a>].</i></p>
+      </xsl:when>
+    </xsl:choose>
+  </xsl:template>
+
+  <!-- Table of Contents -->
+
+  <!-- Named template "toc": emits the "Contents" heading followed by a <ul class="toc"> list.
+       The children of the caller's context node are processed in mode "toc", and a fixed entry
+       linking to the #Modifications anchor is appended as the last list item. -->
+  <xsl:template name="toc">
+    <h4>Contents</h4>
+    <ul class="toc">
+      <xsl:apply-templates mode="toc"/>
+      <li>
+        <a href="#Modifications">Modifications</a>
+      </li>
+    </ul>
+  </xsl:template>
+
+  <!-- TOC entry for a section or for the acknowledgments: one <li> holding the entry's title
+       (rendered in mode "toc"). When the entry has at least one child section, a nested
+       <ul class="toc"> is emitted for its child entries.
+       The nested select spells the element "acknowledgments", exactly as this template's match
+       pattern does; the variant spelling "acknowledgements" names a different element and would
+       never select the element this template handles. -->
+  <xsl:template match="section|acknowledgments" mode="toc">
+    <li>
+      <xsl:apply-templates select="title" mode="toc"/>
+      <xsl:if test="section">
+        <ul class="toc">
+          <xsl:apply-templates select="section|acknowledgments" mode="toc"/>
+        </ul>
+      </xsl:if>
+    </li>
+  </xsl:template>
+
+  <!-- TOC line for a section title: the multi-level section number (format "1.1"), four
+       no-break spaces, then the title content wrapped in a link to "#{$id}".
+       Parameter "id" defaults to the output of the named template "parentid". -->
+  <xsl:template match="section/title" mode="toc">
+    <xsl:param name="id">
+      <xsl:call-template name="parentid"/>
+    </xsl:param>
+    <xsl:number level="multiple" count="section" format="1.1"/>
+    <xsl:text>&#x00A0;&#x00A0;&#x00A0;&#x00A0;</xsl:text>
+    <a href="#{$id}">
+      <xsl:apply-templates/>
+    </a>
+  </xsl:template>
+
+  <!-- TOC line for the acknowledgments title: an unnumbered link to "#{$id}" wrapping the
+       title content. Parameter "id" defaults to the output of the named template "parentid". -->
+  <xsl:template match="acknowledgments/title" mode="toc">
+    <xsl:param name="id">
+      <xsl:call-template name="parentid"/>
+    </xsl:param>
+    <a href="#{$id}">
+      <xsl:apply-templates/>
+    </a>
+  </xsl:template>
+
+  <!-- In mode "toc", any element or text node not handled by a more specific template
+       produces no output. -->
+  <xsl:template match="*|text()" mode="toc"/>
+
+  <!-- Sections -->
+
+  <!-- Section heading in the body. The heading element is h{N+1}, where N is the number of
+       section ancestors of the title (so the title of a top-level section becomes h2).
+       The heading holds a named anchor ("{$id}") containing the multi-level section number,
+       a space and the title content. Parameter "id" defaults to the output of "parentid". -->
+  <xsl:template match="section/title">
+    <xsl:param name="id">
+      <xsl:call-template name="parentid"/>
+    </xsl:param>
+    <xsl:element name="h{count(ancestor::section)+1}">
+      <a name="{$id}">
+        <xsl:number level="multiple" count="section" format="1.1"/>
+        <xsl:text> </xsl:text>
+        <xsl:apply-templates/>
+      </a>
+    </xsl:element>
+  </xsl:template>
+
+  <!-- Acknowledgments heading in the body: always an <h2>, unnumbered, holding a named anchor
+       ("{$id}") around the title content. Parameter "id" defaults to the output of "parentid". -->
+  <xsl:template match="acknowledgments/title">
+    <xsl:param name="id">
+      <xsl:call-template name="parentid"/>
+    </xsl:param>
+    <h2>
+      <a name="{$id}">
+        <xsl:apply-templates/>
+      </a>
+    </h2>
+  </xsl:template>
+
+  <!-- A para becomes an HTML <p> wrapping its processed content. -->
+  <xsl:template match="para">
+    <p><xsl:apply-templates/></p>
+  </xsl:template>
+
+  <!-- A codeblock becomes an HTML <pre> wrapping its processed content. -->
+  <xsl:template match="codeblock">
+    <pre><xsl:apply-templates/></pre>
+  </xsl:template>
+
+  <!-- A codephrase becomes an inline HTML <code> wrapping its processed content. -->
+  <xsl:template match="codephrase">
+    <code><xsl:apply-templates/></code>
+  </xsl:template>
+
+  <!-- Renders a ulink as an HTML anchor whose href is the @url attribute.
+       * type="newwindow" adds target="_blank".
+       * If the ulink has at least one text-node child, its content is processed as the link
+         text; otherwise the URL itself is used as the link text.
+       NOTE(review): a ulink whose only children are elements (no direct text) falls into the
+       "URL as link text" case; confirm that this is intended. -->
+  <xsl:template match="ulink">
+    <a href="{@url}">
+      <xsl:if test="@type='newwindow'">
+        <xsl:attribute name="target">_blank</xsl:attribute>
+      </xsl:if>
+      <xsl:if test="text()">
+        <xsl:apply-templates/>
+      </xsl:if>
+      <xsl:if test="not(text())">
+        <xsl:value-of select="@url"/>
+      </xsl:if>
+    </a>
+  </xsl:template>
+
+  <!-- Whitespace-only text nodes inside ucdxml:block elements of the source document are kept. -->
+  <xsl:preserve-space elements="ucdxml:block"/>
+
+  <!-- Index of ucdxml:block elements by their @id; looked up with the @linkend of
+       ucdxml:include elements. -->
+  <xsl:key name="ucdxml-key" match="ucdxml:block" use="@id"/>
+
+  <!-- Renders a reference to the ucdxml:block element(s) whose @id equals this include's
+       @linkend, as italic text of the form "[label: n, m]".
+       The label is, in order of preference: this element's @title; the @title of the target
+       block when exactly one block matches; the raw @linkend value.
+       Each number is the target block's position among all ucdxml:block elements in the
+       document (xsl:number level="any") and links to that block's "ucdxml:{generate-id()}"
+       anchor; numbers are separated by ", ". -->
+  <xsl:template match="ucdxml:include">
+    <i>
+      <xsl:text>[</xsl:text>
+        <xsl:choose>
+          <xsl:when test="@title">
+            <xsl:value-of select="@title"/>
+          </xsl:when>
+          <xsl:when test="count (key ('ucdxml-key', @linkend)) = 1">
+            <xsl:value-of select="key ('ucdxml-key', @linkend)/@title"/>
+          </xsl:when>
+          <xsl:otherwise>
+            <xsl:value-of select="@linkend"/>
+          </xsl:otherwise>
+        </xsl:choose>
+        <xsl:text>: </xsl:text>
+        <xsl:for-each select="key('ucdxml-key',@linkend)">
+          <a href="#ucdxml:{generate-id ()}"><xsl:number count="ucdxml:block" level="any"/></a>
+          <xsl:if test="position() != last ()">, </xsl:if></xsl:for-each><xsl:text>]</xsl:text>
+    </i>
+  </xsl:template>
+
+  <!-- Renders a schema fragment: a paragraph with an italic, anchored label "[title, n] ="
+       (n is the block's position among all ucdxml:block elements in the document), followed
+       by the processed block content in a <tt> styled with white-space: pre.
+       The anchor name "ucdxml:{generate-id()}" has the same form as the link targets written
+       by the ucdxml:include template. -->
+  <xsl:template match="ucdxml:block">
+    <p>
+      <i><a name="ucdxml:{generate-id()}">[<xsl:value-of select="@title"/>,
+        <xsl:number count="ucdxml:block" level="any"/>]
+      </a>
+        =</i>
+      <tt style="white-space: pre;">
+        <xsl:apply-templates/>
+      </tt>
+    </p>
+  </xsl:template>
+
+  <!-- Renders a ucdxml:schema element: a paragraph with an italic, anchored label "[title] ="
+       (no number), followed by the processed children of the schema element. -->
+  <xsl:template match="ucdxml:schema">
+    <p>
+      <i><a name="ucdxml:{generate-id()}">[<xsl:value-of select="@title"/>]
+      </a>
+        =</i>
+      <xsl:apply-templates/>
+    </p>
+  </xsl:template>
+
+  <!-- Text directly inside a ucdxml:schema is emitted in a <tt> styled with white-space: pre,
+       so its line breaks and indentation are displayed as written. -->
+  <xsl:template match="ucdxml:schema/text()">
+    <tt style="white-space: pre;"><xsl:value-of select="."/></tt>
+  </xsl:template>
+
+  <!-- Revision history aka. Modifications -->
+
+  <!-- One revision entry: a <div> with a bold "Revision N" line (N taken from @revnumber)
+       followed by the processed content of the revision element. -->
+  <xsl:template match="revision">
+    <div>
+      <p>
+        <b>Revision <xsl:value-of select="@revnumber"/></b>
+      </p>
+      <xsl:apply-templates/>
+    </div>
+  </xsl:template>
+
+  <!-- A proposed_update element becomes a <div> containing a single <p> with its processed
+       content. -->
+  <xsl:template match="proposed_update">
+    <div>
+      <p>
+        <xsl:apply-templates/>
+      </p>
+    </div>
+  </xsl:template>
+
+  <!-- A changes element becomes an unordered list wrapping its processed content. -->
+  <xsl:template match="changes">
+    <ul>
+      <xsl:apply-templates/>
+    </ul>
+  </xsl:template>
+
+  <!-- A change element becomes a list item wrapping its processed content. -->
+  <xsl:template match="change">
+    <li>
+      <xsl:apply-templates/>
+    </li>
+  </xsl:template>
+
+  <!-- Copyright -->
+
+  <!-- Named template "copyright": emits three fixed <p class="copyright"> paragraphs.
+       The first starts with the year range "2008" to the result of processing
+       articleinfo/copyright/year, selected relative to the caller's context node. -->
+  <xsl:template name="copyright">
+    <p class="copyright">&#xa9; 2008–<xsl:apply-templates select="articleinfo/copyright/year"/> Unicode, Inc. This
+      publication is protected by copyright, and permission must be obtained from Unicode, Inc. prior to any
+      reproduction, modification, or other use not permitted by the
+      <a href="https://www.unicode.org/copyright.html">Terms of Use</a>. Specifically, you may make copies of this
+      publication and may annotate and translate it solely for personal or internal business purposes and not for
+      public distribution, provided that any such permitted copies and modifications fully reproduce all copyright and
+      other legal notices contained in the original. You may not make copies of or modifications to this publication
+      for public distribution, or incorporate it in whole or in part into any product or publication without the
+      express written permission of Unicode.</p>
+
+    <p class="copyright">Use of all Unicode Products, including this publication, is governed by the Unicode
+      <a href="https://www.unicode.org/copyright.html">Terms of Use</a>. The authors, contributors, and publishers have
+      taken care in the preparation of this publication, but make no express or implied representation or warranty of
+      any kind and assume no responsibility or liability for errors or omissions or for consequential or incidental
+      damages that may arise therefrom. This publication is provided “AS-IS” without charge as a convenience to
+      users.</p>
+
+    <p class="copyright">Unicode and the Unicode Logo are registered trademarks of Unicode, Inc., in the United States
+      and other countries.</p>
+  </xsl:template>
+
+  <!-- Common templates -->
+
+  <!-- Named template "apply-draft-highlighting": when the article's unicode:tr element has
+       stage="proposed-update", adds a highlighting style attribute (yellow background, dotted
+       border) to the element currently being constructed by the caller.
+       Because it writes an attribute, it has to be called before any child content has been
+       added to that element. -->
+  <xsl:template name="apply-draft-highlighting">
+    <xsl:if test="//article/articleinfo/unicode:tr/@stage='proposed-update'">
+      <xsl:attribute name="style">background-color: #ffff00; border-style:dotted; border-width:1px</xsl:attribute>
+    </xsl:if>
+  </xsl:template>
+
+  <!-- Named template "parentid": yields the anchor id for the caller's context node.
+       If the parent element carries an @id attribute, that value is used; otherwise the
+       result is generate-id() of the context node itself. -->
+  <xsl:template name="parentid">
+    <xsl:if test="../@id">
+      <xsl:value-of select="../@id"/>
+    </xsl:if>
+    <xsl:if test="not(../@id)">
+      <xsl:value-of select="generate-id()"/>
+    </xsl:if>
+  </xsl:template>
+
+  <!-- A prop element adds no markup of its own; only its content is processed. -->
+  <xsl:template match="prop">
+    <xsl:apply-templates/>
+  </xsl:template>
+
+  <!-- An elem element is rendered in <tt>. -->
+  <xsl:template match="elem">
+    <tt><xsl:apply-templates/></tt>
+  </xsl:template>
+
+  <!-- An attr element is rendered in <tt>. -->
+  <xsl:template match="attr">
+    <tt><xsl:apply-templates/></tt>
+  </xsl:template>
+
+  <!-- A val element is rendered in <tt>. -->
+  <xsl:template match="val">
+    <tt><xsl:apply-templates/></tt>
+  </xsl:template>
+
+  <!-- A phrase flagged revisionflag="added" is wrapped in a highlighting <span>
+       (yellow background, dotted border). -->
+  <xsl:template match="phrase[@revisionflag='added']">
+    <span style="background-color: #ffff00; border-style:dotted; border-width:1px">
+      <xsl:apply-templates/>
+    </span>
+  </xsl:template>
+
+  <!-- A phrase flagged revisionflag="modified" gets the same highlighting <span> as an
+       added phrase (yellow background, dotted border). -->
+  <xsl:template match="phrase[@revisionflag='modified']">
+    <span style="background-color: #ffff00; border-style:dotted; border-width:1px">
+      <xsl:apply-templates/>
+    </span>
+  </xsl:template>
+
+</xsl:stylesheet>
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/index2rnc.xsl b/unicodetools/src/main/resources/org/unicode/uax42/index2rnc.xsl
new file mode 100644
index 000000000..b7a8dfa81
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/index2rnc.xsl
@@ -0,0 +1,45 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<!-- Produces plain text (output method "text") from the ucdxml:schema elements that carry a
+     @file attribute: a copyright comment line followed by the schema content, with
+     ucdxml:include references replaced by the blocks they point to. -->
+<xsl:stylesheet 
+  xmlns:xsl="http://www.w3.org/1999/XSL/Transform"
+  xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml"
+  xmlns="http://www.w3.org/TR/REC-html40"
+  version="2.0">
+
+  <xsl:output
+          method="text"
+          encoding="UTF-8"/>
+
+  <!-- Entry point: process every ucdxml:schema in the document that has a @file attribute. -->
+  <xsl:template match='/'>
+    <xsl:apply-templates select='/descendant::ucdxml:schema[@file]'/>
+  </xsl:template>
+
+  <!-- Writes a "# Copyright" line using /article/articleinfo/copyright/year, then the
+       processed content of the schema element. The literal text in this template, including
+       its line breaks and indentation, is part of the output. -->
+  <xsl:template match='ucdxml:schema[@file]'>
+    # Copyright &#x00A9; <xsl:value-of select='/article/articleinfo/copyright/year'/> Unicode, Inc.
+
+    <xsl:apply-templates/>
+  </xsl:template>
+
+  <!-- Blocks flagged as deleted contribute nothing to the output. -->
+  <xsl:template match='ucdxml:block[@revisionflag="deleted"]'/>
+
+  <!-- Index of ucdxml:block elements by @id, used to resolve ucdxml:include/@linkend. -->
+  <xsl:key name='block-key' match='ucdxml:block' use='@id'/>
+
+  <!-- An include is replaced by the processed block(s) whose @id equals its @linkend. -->
+  <xsl:template match='ucdxml:include'>
+    <xsl:apply-templates select='key("block-key", @linkend)'/>
+  </xsl:template>
+
+  <!-- Phrases flagged as deleted contribute nothing to the output. -->
+  <xsl:template match='phrase[@revisionflag="deleted"]'/>
+
+  <!-- Phrases flagged as added contribute their processed content. -->
+  <xsl:template match='phrase[@revisionflag="added"]'>
+    <xsl:apply-templates/>
+  </xsl:template>
+
+  <!-- Fallback for every other attribute or node: copy it and process its attributes and
+       children. -->
+  <xsl:template match='@* | node()'>
+    <xsl:copy>
+      <xsl:apply-templates select='@* | node()'/>
+    </xsl:copy>
+  </xsl:template>
+
+  <!-- Elements named JRW produce no output.
+       NOTE(review): the purpose of this element name is not evident from this stylesheet;
+       confirm whether the rule is still needed. -->
+  <xsl:template match="JRW"/>
+
+</xsl:stylesheet>
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/output/index.html b/unicodetools/src/main/resources/org/unicode/uax42/output/index.html
new file mode 100644
index 000000000..13bf8181d
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/output/index.html
@@ -0,0 +1,3482 @@
+
+<!DOCTYPE html
+  PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml"
+      xmlns:ucdxml="http://unicode.org/ns/2001/ucdxml">
+   <head>
+      <meta http-equiv="content-type" content="text/html; charset=UTF-8"/>
+      <link rel="stylesheet"
+            type="text/css"
+            href="https://www.unicode.org/reports/reports-v2.css"/>
+      <title>UAX #42: Unicode Character Database in XML</title>
+   </head>
+   <body style="background-color:#ffffff">
+      <table class="header" cellpadding="0" cellspacing="0" width="100%">
+         <tbody>
+            <tr>
+               <td class="icon">
+                  <a href="https://www.unicode.org/">
+                     <img style="vertical-align:middle;border:0"
+                          alt="[Unicode]"
+                          src="https://www.unicode.org/webscripts/logo60s2.gif"
+                          height="33"
+                          width="34"/>
+                  </a> <a class="bar" href="https://www.unicode.org/reports/">Technical Reports</a>
+               </td>
+            </tr>
+            <tr>
+               <td class="gray"> </td>
+            </tr>
+         </tbody>
+      </table>
+      <div class="body">
+         <h2 style="text-align:center">
+            <span style="background-color: #ffff00; border-style:dotted; border-width:1px">Proposed Update</span> Unicode® Standard Annex #42</h2>
+         <h1 style="text-align:center">Unicode Character Database in XML</h1>
+         <table class="simple" width="90%">
+            <tbody>
+               <tr>
+                  <td valign="top" width="20%">Version</td>
+                  <td valign="top">Unicode <span style="background-color: #ffff00; border-style:dotted; border-width:1px">16.0.0</span>
+                  </td>
+               </tr>
+               <tr>
+                  <td valign="top">
+                Editor
+              </td>
+                  <td valign="top">
+            John Wilcock<br/>
+                  </td>
+               </tr>
+               <tr>
+                  <td valign="top">Date</td>
+                  <td valign="top">
+                     <span style="background-color: #ffff00; border-style:dotted; border-width:1px">2024-08-15</span>
+                  </td>
+               </tr>
+               <tr>
+                  <td valign="top">This Version</td>
+                  <td valign="top">
+                     <span style="background-color: #ffff00; border-style:dotted; border-width:1px">
+                        <a href="https://www.unicode.org/reports/tr42/tr42-36.html">https://www.unicode.org/reports/tr42/tr42-36.html</a>
+                     </span>
+                  </td>
+               </tr>
+               <tr>
+                  <td valign="top">Previous Version</td>
+                  <td valign="top">
+                     <span style="background-color: #ffff00; border-style:dotted; border-width:1px">
+                        <a href="https://www.unicode.org/reports/tr42/tr42-34.html">https://www.unicode.org/reports/tr42/tr42-34.html</a>
+                     </span>
+                  </td>
+               </tr>
+               <tr>
+                  <td valign="top">Latest Version</td>
+                  <td valign="top">
+                     <a href="https://www.unicode.org/reports/tr42/">https://www.unicode.org/reports/tr42/</a>
+                  </td>
+               </tr>
+               <tr>
+                  <td valign="top">Latest Proposed Update</td>
+                  <td valign="top">
+                     <a href="https://www.unicode.org/reports/tr42/proposed.html">https://www.unicode.org/reports/tr42/proposed.html</a>
+                  </td>
+               </tr>
+               <tr>
+                  <td valign="top">Schema</td>
+                  <td valign="top">
+                     <span style="background-color: #ffff00; border-style:dotted; border-width:1px">
+                        <a href="https://www.unicode.org/reports/tr42/tr42-36.rnc">https://www.unicode.org/reports/tr42/tr42-36.rnc</a>
+                     </span>
+                  </td>
+               </tr>
+               <tr>
+                  <td valign="top">Revision</td>
+                  <td valign="top">
+                     <a href="#Modifications">
+                        <span style="background-color: #ffff00; border-style:dotted; border-width:1px">36</span>
+                     </a>
+                  </td>
+               </tr>
+            </tbody>
+         </table>
+         <h4 style="margin-top: 1em;">Summary</h4>
+         <p>
+            <i>This annex describes an XML representation of the Unicode Character Database.</i>
+         </p>
+         <h4>
+            <i>Status</i>
+         </h4>
+         <p style="background-color: #ffff00; border-style:dotted; border-width:1px">
+            <i>This is a <b>
+                  <span style="color:#ff0000">draft</span>
+               </b> document which may be updated, replaced, or
+            superseded by other documents at any time. Publication does not imply endorsement by the Unicode
+            Consortium.  This is not a stable document; it is inappropriate to cite this document as other than a
+            work in progress.</i>
+         </p>
+         <blockquote>
+            <p>
+               <i>
+                  <b>A Unicode Standard Annex (UAX)</b> forms an integral part of the Unicode Standard, but is
+            published online as a separate document. The Unicode Standard may require conformance to normative
+            content in a Unicode Standard Annex, if so specified in the Conformance chapter of that version of the
+            Unicode Standard. The version number of a UAX document corresponds to the version of the Unicode Standard
+            of which it forms a part.</i>
+            </p>
+         </blockquote>
+         <p>
+            <i>Please submit corrigenda and other comments with the online reporting form [<a href="https://www.unicode.org/reporting.html">Feedback</a>]. Related information that is useful in
+          understanding this annex is found in Unicode Standard Annex #41, “<a href="https://www.unicode.org/reports/tr41/tr41-32.html">Common References for Unicode Standard
+            Annexes.</a>” For the latest version of the Unicode Standard, see [<a href="https://www.unicode.org/versions/latest/">Unicode</a>]. For a list of current Unicode
+          Technical Reports, see [<a href="https://www.unicode.org/reports/">Reports</a>]. For more information about
+          versions of the Unicode Standard, see [<a href="https://www.unicode.org/versions/">Versions</a>]. For any
+          errata which may apply to this annex, see [<a href="https://www.unicode.org/errata/">Errata</a>].</i>
+         </p>
+         <h4>Contents</h4>
+         <ul class="toc">
+            <li>1    <a href="#d1e1734">Introduction</a>
+            </li>
+            <li>2    <a href="#d1e1763">Overall schema</a>
+               <ul class="toc">
+                  <li>2.1    <a href="#d1e1769">General principles</a>
+                  </li>
+                  <li>2.2    <a href="#d1e1806">Namespace</a>
+                  </li>
+                  <li>2.3    <a href="#d1e1823">Datatypes</a>
+                  </li>
+                  <li>2.4    <a href="#d1e1845">Root Element</a>
+                  </li>
+                  <li>2.5    <a href="#d1e1862">Common attributes</a>
+                  </li>
+                  <li>2.6    <a href="#d1e1880">Ordering of elements</a>
+                  </li>
+               </ul>
+            </li>
+            <li>3    <a href="#d1e1897">Description</a>
+            </li>
+            <li>4    <a href="#d1e1922">Repertoire</a>
+               <ul class="toc">
+                  <li>4.1    <a href="#d1e1941">Sets of code points</a>
+                  </li>
+                  <li>4.2    <a href="#d1e1972">Code point types</a>
+                  </li>
+                  <li>4.3    <a href="#d1e2000">Group</a>
+                  </li>
+                  <li>4.4    <a href="#d1e2056">Properties</a>
+                     <ul class="toc">
+                        <li>4.4.1    <a href="#d1e2085">Age property</a>
+                        </li>
+                        <li>4.4.2    <a href="#d1e2100">Name properties</a>
+                        </li>
+                        <li>4.4.3    <a href="#d1e2151">Name Alias properties</a>
+                        </li>
+                        <li>4.4.4    <a href="#d1e2168">Block property</a>
+                        </li>
+                        <li>4.4.5    <a href="#d1e2185">General Category</a>
+                        </li>
+                        <li>4.4.6    <a href="#d1e2201">Combining properties</a>
+                        </li>
+                        <li>4.4.7    <a href="#d1e2219">Bidirectionality properties</a>
+                        </li>
+                        <li>4.4.8    <a href="#d1e2277">Decomposition properties</a>
+                        </li>
+                        <li>4.4.9    <a href="#d1e2337">Numeric Properties</a>
+                        </li>
+                        <li>4.4.10    <a href="#d1e2357">Joining properties</a>
+                        </li>
+                        <li>4.4.11    <a href="#d1e2388">Linebreak properties</a>
+                        </li>
+                        <li>4.4.12    <a href="#d1e2406">East Asian Width property</a>
+                        </li>
+                        <li>4.4.13    <a href="#d1e2421">Case properties</a>
+                        </li>
+                        <li>4.4.14    <a href="#d1e2513">Script properties</a>
+                        </li>
+                        <li>4.4.15    <a href="#d1e2531">ISO Comment properties</a>
+                        </li>
+                        <li>4.4.16    <a href="#d1e2546">Hangul properties</a>
+                        </li>
+                        <li>4.4.17    <a href="#d1e2573">Indic properties</a>
+                        </li>
+                        <li>4.4.18    <a href="#d1e2612">Identifier and Pattern and programming language properties</a>
+                        </li>
+                        <li>4.4.19    <a href="#d1e2652">Properties related to function and graphic characteristics</a>
+                        </li>
+                        <li>4.4.20    <a href="#d1e2712">Properties related to boundaries</a>
+                        </li>
+                        <li>4.4.21    <a href="#d1e2741">Properties related to ideographs</a>
+                        </li>
+                        <li>4.4.22    <a href="#d1e2769">Miscellaneous properties</a>
+                        </li>
+                        <li>4.4.23    <a href="#d1e2788">Unihan properties</a>
+                        </li>
+                        <li>4.4.24    <a href="#d1e2801">Tangut data</a>
+                        </li>
+                        <li>4.4.25    <a href="#d1e2818">Nushu data</a>
+                        </li>
+                        <li>4.4.26    <a href="#d1e2835">Emoji properties</a>
+                        </li>
+                     </ul>
+                  </li>
+               </ul>
+            </li>
+            <li>5    <a href="#d1e2864">Blocks</a>
+            </li>
+            <li>6    <a href="#d1e2884">Named Sequences</a>
+            </li>
+            <li>7    <a href="#d1e2911">Normalization Corrections</a>
+            </li>
+            <li>8    <a href="#d1e2932">Standardized Variants</a>
+            </li>
+            <li>9    <a href="#d1e2952">CJK Radicals</a>
+            </li>
+            <li>10    <a href="#d1e2972">Emoji sources</a>
+            </li>
+            <li>11    <a href="#d1e2995">Do Not Emit</a>
+            </li>
+            <li>12    <a href="#d1e3014">The full schema</a>
+            </li>
+            <li>13    <a href="#d1e3064">Examples</a>
+            </li>
+            <li>
+               <a href="#d1e3076">Acknowledgments</a>
+            </li>
+            <li>
+               <a href="#Modifications">Modifications</a>
+            </li>
+         </ul>
+         <hr/>
+         <h2>
+            <a name="d1e1734">1 Introduction</a>
+         </h2>
+         <p>In working on Unicode implementations, it is often useful to access the full content of the Unicode
+            Character Database (UCD). For example, in establishing mappings from characters to glyphs in fonts, it is
+            convenient to see the character scalar value, the character name, the character East Asian width, along with
+            the shape and metrics of the proposed glyph to map to; looking at all this data simultaneously helps in
+            evaluating the mapping.
+        </p>
+         <p>Directly accessing the data files that constitute the UCD is sometimes a daunting proposition. The data is
+            dispersed in a number of files of various formats, and there are just enough peculiarities (all justified by
+            the processing power available at the time the UCD representation was designed) to require a fairly intimate
+            knowledge of the data format itself, in addition to the meaning of the data.
+        </p>
+         <p>Many programming environments (for example, Java or ICU) do give access to the UCD. However, those
+            environments tend to lag behind releases of the standard, or support only some of the UCD content.
+        </p>
+         <p>Unibook is a wonderful tool to explore the UCD and in many cases is just the ticket; however, it is
+            difficult to use when the task at hand has not been built-in, or when non-UCD data is to be displayed as
+            well.
+        </p>
+         <p>This annex presents an alternative representation of the UCD, which is meant to overcome these
+            difficulties. We have chosen an XML representation, because parsing becomes a non-issue: there are a number
+            of XML parsers freely available, and using them is often fairly easy. In addition, there are freely
+            available tools that can perform powerful operations on XML data; for example, XPATH and XQUERY engines can
+            be thought of as a “grep” for XML data and XSLT engines can be thought of as
+            “awk” for XML data.
+        </p>
+         <p>It is important to note that we are interested in exploring the content of the UCD, rather than in using
+            the UCD data to process character streams. Thus, we are not concerned so much by the speed of processing or
+            the size of our representation.
+        </p>
+         <p>Our representation supports the creation of documents that represent only parts of the UCD, either by not
+            representing all the characters, or by not representing all the properties. This can be useful when only
+            some of the data is needed.
+        </p>
+         <p>This annex presents only the XML representation format of the UCD. The data itself is part of the <a href="https://www.unicode.org/reports/tr41/tr41-34.html#UCD">Unicode
+            Character Database</a>.
+        </p>
+         <h2>
+            <a name="d1e1763">2 Overall schema</a>
+         </h2>
+         <h3>
+            <a name="d1e1769">2.1 General principles</a>
+         </h3>
+         <p>Our schema can be used to create and validate documents which are intended to represent properties of
+                Unicode code points, blocks, named sequences, normalization corrections, standardized variants, CJK
+                radicals and emoji sources. A document may represent the values actually assigned in a given version of
+                the UCD, or it may represent a draft version of the UCD, or a private agreement on Private Use
+                characters. The validity of an XML document with respect to the schema defined in this annex does not
+                assert anything about the correctness of the values.
+            </p>
+         <p>Valid documents may provide values for only some of the code points, or some of the Unicode
+                properties. Furthermore, they may also incorporate non-Unicode properties.
+            </p>
+         <p>Our schema is defined using English. However, a useful subset of the validity constraints can be
+                captured using a schema language, thereby simplifying the task of validating documents. We have chosen
+                Relax NG [<a href="https://www.unicode.org/reports/tr41/tr41-34.html#ISO19757">ISO 19757</a>],
+                in the compact syntax, as the schema language. It is important to stress that the schema which is
+                defined in English imposes more constraints on the documents than can be validated with the Relax NG
+                schema.
+            </p>
+         <p>An important characteristic of Relax NG is that its schemas do not modify or augment the infoset of
+                the documents. Therefore, it is possible to process our XML representation without using the schema.
+                Also, the schema is relatively straightforward and can be converted mechanically to other schema
+                languages.
+            </p>
+         <p>While our XML representation is not intended to be used during processing of characters and strings,
+                it is still a design principle for our schema to support the relatively efficient representation of the
+                UCD. This is achieved by an inheritance mechanism, similar to property inheritance in CSS or in XSL:FO
+                (see section 4.3 Group).
+            </p>
+         <p>Many invariants impose constraints on the values of the different properties for a given code point.
+                For example, if the value of the Numeric Type property is None, then the value of the
+                Numeric Value property should be the empty string; and if the value of the Other
+                Alphabetic property is true, then the value of the Alphabetic property should be
+                true. Those invariants are not captured in the schema.
+            </p>
+         <h3>
+            <a name="d1e1806">2.2 Namespace</a>
+         </h3>
+         <p>The namespace for our elements is “http://www.unicode.org/ns/2003/ucd/1.0”. Our
+                attributes are in the empty namespace.
+            </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e1812">[namespace declaration,
+        1]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  default namespace ucd = "http://www.unicode.org/ns/2003/ucd/1.0"
+</tt>
+         </p>
+         <p>In all our examples, we assume that this namespace is the default one.
+            </p>
+         <h3>
+            <a name="d1e1823">2.3 Datatypes</a>
+         </h3>
+         <p>We use the standard XML Schema datatypes:</p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e1829">[datatypes declaration,
+        2]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  # default; datatypes xsd = "http://www.w3.org/2001/XMLSchema-datatypes"
+</tt>
+         </p>
+         <p>Characters are pervasive in the UCD, and will need to be represented. Representing characters directly
+                by themselves would seem the most obvious choice; for example, we could express that the decomposition
+                of U+00E8 is “&amp;#x0065;&amp;#x0300;”, that is, have exactly two characters in (the
+                infoset of) the XML document. However, the current XML specification limits the set of characters
+                that can be part of a document. Another problem is that the various tools (XML parser, XPATH engine,
+                etc.) may equate U+00E8 with U+0065 U+0300, thus making it difficult to figure out which of the two
+                sequences is contained in the database (which is sometimes important for our purposes). Therefore, we
+                chose instead to represent characters by their code points; we follow the usual convention of four to
+                six hexadecimal digits (uppercase) and code points in a sequence separated by space; for example, the
+                decomposition of U+00E8 will be represented by the nine characters “0065 0300” in the
+                infoset.
+            </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e1837">[datatype for code points,
+        3]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  single-code-point = xsd:string { pattern = "(|[1-9A-F]|(10))[0-9A-F]{4}" }
+
+  one-or-more-code-points = list { single-code-point + }
+  zero-or-more-code-points = list { single-code-point * }
+  two-code-points = list { single-code-point, single-code-point }
+</tt>
+         </p>
+         <h3>
+            <a name="d1e1845">2.4 Root Element</a>
+         </h3>
+         <p>The root element of valid documents is a <tt>ucd</tt>.
+            </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e1854">[schema start,
+        4]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  start =
+    element ucd { ucd.content }
+</tt>
+         </p>
+         <h3>
+            <a name="d1e1862">2.5 Common attributes</a>
+         </h3>
+         <p>A large number of properties are boolean. We uniformly use the values <tt>Y</tt> and
+                <tt>N</tt> for those:
+            </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e1871">[boolean,
+        5]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  boolean = "Y" | "N"
+</tt>
+         </p>
+         <h3>
+            <a name="d1e1880">2.6 Ordering of elements</a>
+         </h3>
+         <p>In elements that hold lists of child elements, such as <tt>repertoire</tt>,
+                <tt>group</tt>, or <tt>standardized-variants</tt>, the schema does not require that the
+                child elements be in any particular order.
+            </p>
+         <h2>
+            <a name="d1e1897">3 Description</a>
+         </h2>
+         <p>The root element may have a <tt>description</tt> child element, which in turn contains any string,
+            which is meant to describe what the XML document purports to describe.
+        </p>
+         <p>It is recommended that if the document purports to represent the UCD of some Unicode version, the
+            <tt>description</tt> be selected in accord with the rules listed in <a href="https://www.unicode.org/reports/tr41/tr41-34.html#Versions">[Versions]</a>; and
+            conversely, that documents which do not purport to represent the UCD be described as such.
+        </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e1914">[description,
+        6]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  ucd.content &amp;=
+    element description { text }?
+</tt>
+         </p>
+         <h2>
+            <a name="d1e1922">4 Repertoire</a>
+         </h2>
+         <p>The <tt>repertoire</tt> child element of the <tt>ucd</tt> element describes the code points and
+            their properties. As we will see shortly, code points can be described individually or as part of a group:
+        </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e1933">[repertoire,
+        7]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  ucd.content &amp;=
+    element repertoire { (code-point | group) + }?
+</tt>
+         </p>
+         <h3>
+            <a name="d1e1941">4.1 Sets of code points</a>
+         </h3>
+         <p>It is often the case that successive code points have the same property values, for a given set of
+                properties. The most striking example is that of an unallocated plane, where all but the last two
+                code points are reserved and have the same property values. Another example is the URO (U+4E00
+                .. U+9FA5) where all the code points have the same property values if we ignore their name and their
+                Unihan properties.
+            </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e1947">[Set of code points,
+        8]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  set-of-code-points =
+     attribute cp { single-code-point }
+   | ( attribute first-cp { single-code-point },
+       attribute last-cp  { single-code-point } )
+</tt>
+         </p>
+         <p>This observation suggests that it is profitable to represent sets of code points which share the
+                same properties, rather than individual code points. To make the representation of the sets simple,
+                we restrict them to be segments in the code point space, that is a set is defined by the first and
+                last code point it contains. Those are captured by the attributes <tt>first-cp</tt> and
+                <tt>last-cp</tt>. The attribute <tt>cp</tt> is a shorthand notation for the case where the set
+                has a single code point.
+            </p>
+         <p>In the <tt>repertoire</tt>, there must be at most one <tt>code-point</tt>
+                element for a given code point.
+            </p>
+         <h3>
+            <a name="d1e1972">4.2 Code point types</a>
+         </h3>
+         <p>When thinking about Unicode code points, it is useful to split them into four types:
+            </p>
+         <ul><li>those assigned to abstract characters (PUA or not)</li>
+            <li>the noncharacters</li>
+            <li>the surrogate code points</li>
+            <li>the reserved code points</li></ul>
+            <p>This leads to four elements to describe sets of code points:
+            </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e1992">[Code points,
+        9]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point |=
+    element reserved {
+      set-of-code-points,
+      code-point-attributes }
+
+  code-point |=
+    element noncharacter {
+      set-of-code-points,
+      code-point-attributes }
+
+  code-point |=
+    element surrogate {
+      set-of-code-points,
+      code-point-attributes }
+
+  code-point |=
+    element char {
+      set-of-code-points,
+      code-point-attributes }
+</tt>
+         </p>
+         <h3>
+            <a name="d1e2000">4.3 Group</a>
+         </h3>
+         <p>While we already recognized the situation where a set of code points have exactly the same set of
+                property values, another common situation is that of code points which have almost all the same
+                property values.
+            </p>
+         <p>For example, the characters U+1740 BUHID LETTER A .. U+1753 BUHID VOWEL SIGN U all have the age
+                “3.2”, and all have the script “Buhd”. On the one hand, it is convenient
+                to support data files in which those properties are explicitly listed with every code point, as this
+                makes answering questions like “what is the age of U+1749?” easier, because that data
+                is expressed right there. On the other hand, this leads to rather large data files, and it also tends
+                to obscure the differences between similar characters.
+            </p>
+         <p>Our representation accounts for this situation with the notion of groups. A
+                <tt>group</tt> element is simply a container of code points that also holds default values for
+                the properties. If a code point inside a <tt>group</tt> does not explicitly list a property but the
+                <tt>group</tt> lists it, then the code point inherits that property from its
+                <tt>group</tt>. For example, the fragment with explicit properties:
+            </p>
+         <pre>
+    &lt;char cp="1740" age="3.2" na="BUHID LETTER A" gc="Lo" sc="Buhd"/&gt;
+    &lt;char cp="1741" age="3.2" na="BUHID LETTER I" gc="Lo" sc="Buhd"/&gt;
+    &lt;char cp="1752" age="3.2" na="BUHID VOWEL SIGN I" gc="Mn" sc="Buhd"/&gt;
+    &lt;char cp="1820" age="3.0" na="MONGOLIAN LETTER A" gc="Lo" sc="Mong"/&gt;</pre>
+         <p>is equivalent to this fragment which uses a <tt>group</tt>:
+            </p>
+         <pre>
+    &lt;group age="3.2" gc="Lo" sc="Buhd"&gt;
+        &lt;char cp="1740" na="BUHID LETTER A"/&gt;
+        &lt;char cp="1741" na="BUHID LETTER I"/&gt;
+        &lt;char cp="1752" na="BUHID VOWEL SIGN I" gc="Mn"/&gt;
+        &lt;char cp="1820" age="3.0" na="MONGOLIAN LETTER A" sc="Mong"/&gt;
+    &lt;/group&gt;</pre>
+         <p>The element for U+1740 does not have the <tt>age</tt> attribute, and it therefore inherits it
+                from its enclosing <tt>group</tt> element, that is “3.2”. On the other hand,
+                the element for U+1820 does have this attribute, so the value is “3.0”.
+            </p>
+         <p>As this example illustrates, the notion of <tt>group</tt> does not necessarily align with the
+                notion of Unicode block. It is entirely defined by, and limited to, our representation. In particular, the
+                value of a property for a code point can always be determined from the XML document alone, assuming
+                that this property and this code point are expressed at all. Of course, one may create an XML
+                representation where the groups happen to coincide with the Unicode blocks.
+            </p>
+         <p>Groups cannot be nested. The motivation for this limitation is to make the life of consumers
+                easier: either a property is defined by the element for a code point, or it is defined by the
+                immediately enclosing <tt>group</tt> element.
+            </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2047">[groups,
+        10]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  group =
+    element group {
+      code-point-attributes,
+      code-point* }
+</tt>
+         </p>
+         <h3>
+            <a name="d1e2056">4.4 Properties</a>
+         </h3>
+         <p>Each property, except for the Special_Case_Condition and Name_Alias
+                properties, is represented by an attribute. In an XML data file, the absence of an attribute (possibly
+                only on some <code>code-point</code>s) means that the document does not express the value
+                of the corresponding property. Conversely, the presence of an attribute is an expression of the
+                corresponding property value; the implied null value is represented by the empty string.
+            </p>
+         <p>The Name_Alias property is represented by zero or more <tt>name-alias</tt> child
+                elements. Unlike the situation for properties represented by attributes, it is not possible to determine
+                whether all the aliases have been represented in a data file by inspecting that data file.
+            </p>
+         <p>The name of an attribute is the abbreviated name of the property as given in the file
+                PropertyAliases.txt in the corresponding version of the UCD. For the Unihan
+                properties, the name is that given in the various versions of the Unihan database.
+            </p>
+         <p>For catalog and enumerated properties, the values are those listed in the file
+                PropertyValueAliases.txt in the corresponding version of the UCD; if there is an abbreviated
+                name, it is used, otherwise the long name is used.
+            </p>
+         <p>Note that the set of possible values for a property captured in this schema may change from one
+                version to the next.
+            </p>
+         <h4>
+            <a name="d1e2085">4.4.1 Age property</a>
+         </h4>
+         <p>The <tt>age</tt> attribute captures the version of Unicode in which a code point was
+                    assigned to an abstract character, or made a surrogate or noncharacter.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2092">[age attribute,
+        11]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute age { "1.1"
+                  | "2.0" | "2.1"
+                  | "3.0" | "3.1" | "3.2"
+                  | "4.0" | "4.1"
+                  | "5.0" | "5.1" | "5.2"
+                  | "6.0" | "6.1" | "6.2" | "6.3"
+                  | "7.0"
+                  | "8.0"
+                  | "9.0"
+                  | "10.0"
+                  | "11.0"
+                  | "12.0" | "12.1"
+                  | "13.0"
+                  | "14.0"
+                  | "15.0" | "15.1"
+                  | "16.0"
+                  | "17.0"
+                  | "unassigned"
+                  }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2100">4.4.2 Name properties</a>
+         </h4>
+         <p>There are two name properties: the name given by the current version of the standard
+                    (<tt>na</tt>), and possibly the name this character had in version 1.0 of the standard
+                    (<tt>na1</tt>).
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2109">[na attribute,
+        12]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute na { "" |
+                   "CJK UNIFIED IDEOGRAPH-#" |
+                   "CJK COMPATIBILITY IDEOGRAPH-#" |
+                   "EGYPTIAN HIEROGLYPH-#" |
+                   "TANGUT IDEOGRAPH-#" |
+                   "KHITAN SMALL SCRIPT CHARACTER-#" |
+                   "NUSHU CHARACTER-#" |
+                   xsd:string { pattern="[a-zA-Z0-9]+(( -|- |[\-_ ])[a-zA-Z0-9]+)*" }
+                 }?
+</tt>
+         </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2112">[na1 attribute,
+        13]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute na1 { "" | xsd:string { pattern="[a-zA-Z0-9]+([\-_ ][a-zA-Z0-9]+)*( \(.*\))?" } }?
+</tt>
+         </p>
+         <p>The majority of the characters in Unicode have a name which is of the form CJK UNIFIED
+                    IDEOGRAPH-<code>&lt;code point&gt;</code>. It also happens that character names cannot
+                    contain the character U+0023 # NUMBER SIGN, so we adopted the following convention: if a
+                    code point has the attribute <tt>na</tt> (either directly or by inheritance from an enclosing
+                    group), then occurrences of the character # in the name are to be interpreted as the value of the
+                    code point. For example:
+                </p>
+         <pre>
+    &lt;char cp="3400" na="CJK UNIFIED IDEOGRAPH-3400"/&gt;</pre>
+         <p>and</p>
+         <pre>
+    &lt;char cp="3400" na="CJK UNIFIED IDEOGRAPH-#"/&gt;</pre>
+         <p>are equivalent. The # can be in any position in the value of the <tt>na</tt>
+                    attribute. The convention also applies just as well to a set of multiple code points:
+                </p>
+         <pre>
+    &lt;char cp="3400" na="CJK UNIFIED IDEOGRAPH-3400"/&gt;
+    &lt;char cp="3401" na="CJK UNIFIED IDEOGRAPH-3401"/&gt;</pre>
+         <p>is equivalent to</p>
+         <pre>
+    &lt;char cp="3400" na="CJK UNIFIED IDEOGRAPH-#"/&gt;
+    &lt;char cp="3401" na="CJK UNIFIED IDEOGRAPH-#"/&gt;</pre>
+         <p>which in turn is equivalent to:</p>
+         <pre>
+    &lt;char first-cp="3400" last-cp="3401" na="CJK UNIFIED IDEOGRAPH-#"/&gt;</pre>
+         <h4>
+            <a name="d1e2151">4.4.3 Name Alias properties</a>
+         </h4>
+         <p>The Name_Alias property is represented by zero or more <tt>name-alias</tt>
+                    child elements:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2160">[name-alias element,
+        14]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    element name-alias {
+      attribute alias { xsd:string { pattern="[a-zA-Z0-9]+(( -|- |[\-_ ])[a-zA-Z0-9]+)*" } }?,
+      attribute type  { "abbreviation" | "alternate"
+                      | "control" | "correction"
+                      | "figment"
+                      }? } *
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2168">4.4.4 Block property</a>
+         </h4>
+         <p>The Block property is represented by the <tt>blk</tt> attribute:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2177">[blk attribute,
+        15]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute blk { "Adlam"
+                  | "Aegean_Numbers"
+                  | "Ahom"
+                  | "Alchemical"
+                  | "Alphabetic_PF"
+                  | "Anatolian_Hieroglyphs"
+                  | "Ancient_Greek_Music"
+                  | "Ancient_Greek_Numbers"
+                  | "Ancient_Symbols"
+                  | "Arabic"
+                  | "Arabic_Ext_A"
+                  | "Arabic_Ext_B"
+                  | "Arabic_Ext_C"
+                  | "Arabic_Math"
+                  | "Arabic_PF_A"
+                  | "Arabic_PF_B"
+                  | "Arabic_Sup"
+                  | "Armenian"
+                  | "Arrows"
+                  | "ASCII"
+                  | "Avestan"
+                  | "Balinese"
+                  | "Bamum"
+                  | "Bamum_Sup"
+                  | "Bassa_Vah"
+                  | "Batak"
+                  | "Bengali"
+                  | "Bhaiksuki"
+                  | "Block_Elements"
+                  | "Bopomofo"
+                  | "Bopomofo_Ext"
+                  | "Box_Drawing"
+                  | "Brahmi"
+                  | "Braille"
+                  | "Buginese"
+                  | "Buhid"
+                  | "Byzantine_Music"
+                  | "Carian"
+                  | "Caucasian_Albanian"
+                  | "Chakma"
+                  | "Cham"
+                  | "Cherokee"
+                  | "Cherokee_Sup"
+                  | "Chess_Symbols"
+                  | "Chorasmian"
+                  | "CJK"
+                  | "CJK_Compat"
+                  | "CJK_Compat_Forms"
+                  | "CJK_Compat_Ideographs"
+                  | "CJK_Compat_Ideographs_Sup"
+                  | "CJK_Ext_A"
+                  | "CJK_Ext_B"
+                  | "CJK_Ext_C"
+                  | "CJK_Ext_D"
+                  | "CJK_Ext_E"
+                  | "CJK_Ext_F"
+                  | "CJK_Ext_G"
+                  | "CJK_Ext_H"
+                  | "CJK_Ext_I"
+                  | "CJK_Radicals_Sup"
+                  | "CJK_Strokes"
+                  | "CJK_Symbols"
+                  | "Compat_Jamo"
+                  | "Control_Pictures"
+                  | "Coptic"
+                  | "Coptic_Epact_Numbers"
+                  | "Counting_Rod"
+                  | "Cuneiform"
+                  | "Cuneiform_Numbers"
+                  | "Currency_Symbols"
+                  | "Cypriot_Syllabary"
+                  | "Cypro_Minoan"
+                  | "Cyrillic"
+                  | "Cyrillic_Ext_A"
+                  | "Cyrillic_Ext_B"
+                  | "Cyrillic_Ext_C"
+                  | "Cyrillic_Ext_D"
+                  | "Cyrillic_Sup"
+                  | "Deseret"
+                  | "Devanagari"
+                  | "Devanagari_Ext"
+                  | "Devanagari_Ext_A"
+                  | "Diacriticals"
+                  | "Diacriticals_Ext"
+                  | "Diacriticals_For_Symbols"
+                  | "Diacriticals_Sup"
+                  | "Dingbats"
+                  | "Dives_Akuru"
+                  | "Dogra"
+                  | "Domino"
+                  | "Duployan"
+                  | "Early_Dynastic_Cuneiform"
+                  | "Egyptian_Hieroglyph_Format_Controls"
+                  | "Egyptian_Hieroglyphs"
+                  | "Egyptian_Hieroglyphs_Ext_A"
+                  | "Elbasan"
+                  | "Elymaic"
+                  | "Emoticons"
+                  | "Enclosed_Alphanum"
+                  | "Enclosed_Alphanum_Sup"
+                  | "Enclosed_CJK"
+                  | "Enclosed_Ideographic_Sup"
+                  | "Ethiopic"
+                  | "Ethiopic_Ext"
+                  | "Ethiopic_Ext_A"
+                  | "Ethiopic_Ext_B"
+                  | "Ethiopic_Sup"
+                  | "Garay"
+                  | "Geometric_Shapes"
+                  | "Geometric_Shapes_Ext"
+                  | "Georgian"
+                  | "Georgian_Ext"
+                  | "Georgian_Sup"
+                  | "Glagolitic"
+                  | "Glagolitic_Sup"
+                  | "Gothic"
+                  | "Grantha"
+                  | "Greek"
+                  | "Greek_Ext"
+                  | "Gujarati"
+                  | "Gunjala_Gondi"
+                  | "Gurmukhi"
+                  | "Gurung_Khema"
+                  | "Half_And_Full_Forms"
+                  | "Half_Marks"
+                  | "Hangul"
+                  | "Hanifi_Rohingya"
+                  | "Hanunoo"
+                  | "Hatran"
+                  | "Hebrew"
+                  | "High_PU_Surrogates"
+                  | "High_Surrogates"
+                  | "Hiragana"
+                  | "IDC"
+                  | "Ideographic_Symbols"
+                  | "Imperial_Aramaic"
+                  | "Indic_Number_Forms"
+                  | "Indic_Siyaq_Numbers"
+                  | "Inscriptional_Pahlavi"
+                  | "Inscriptional_Parthian"
+                  | "IPA_Ext"
+                  | "Jamo"
+                  | "Jamo_Ext_A"
+                  | "Jamo_Ext_B"
+                  | "Javanese"
+                  | "Kaithi"
+                  | "Kaktovik_Numerals"
+                  | "Kana_Ext_A"
+                  | "Kana_Ext_B"
+                  | "Kana_Sup"
+                  | "Kanbun"
+                  | "Kangxi"
+                  | "Kannada"
+                  | "Katakana"
+                  | "Katakana_Ext"
+                  | "Kawi"
+                  | "Kayah_Li"
+                  | "Kharoshthi"
+                  | "Khitan_Small_Script"
+                  | "Khmer"
+                  | "Khmer_Symbols"
+                  | "Khojki"
+                  | "Khudawadi"
+                  | "Kirat_Rai"
+                  | "Lao"
+                  | "Latin_1_Sup"
+                  | "Latin_Ext_A"
+                  | "Latin_Ext_Additional"
+                  | "Latin_Ext_B"
+                  | "Latin_Ext_C"
+                  | "Latin_Ext_D"
+                  | "Latin_Ext_E"
+                  | "Latin_Ext_F"
+                  | "Latin_Ext_G"
+                  | "Lepcha"
+                  | "Letterlike_Symbols"
+                  | "Limbu"
+                  | "Linear_A"
+                  | "Linear_B_Ideograms"
+                  | "Linear_B_Syllabary"
+                  | "Lisu"
+                  | "Lisu_Sup"
+                  | "Low_Surrogates"
+                  | "Lycian"
+                  | "Lydian"
+                  | "Mahajani"
+                  | "Mahjong"
+                  | "Makasar"
+                  | "Malayalam"
+                  | "Mandaic"
+                  | "Manichaean"
+                  | "Marchen"
+                  | "Masaram_Gondi"
+                  | "Math_Alphanum"
+                  | "Math_Operators"
+                  | "Mayan_Numerals"
+                  | "Medefaidrin"
+                  | "Meetei_Mayek"
+                  | "Meetei_Mayek_Ext"
+                  | "Mende_Kikakui"
+                  | "Meroitic_Cursive"
+                  | "Meroitic_Hieroglyphs"
+                  | "Miao"
+                  | "Misc_Arrows"
+                  | "Misc_Math_Symbols_A"
+                  | "Misc_Math_Symbols_B"
+                  | "Misc_Pictographs"
+                  | "Misc_Symbols"
+                  | "Misc_Technical"
+                  | "Modi"
+                  | "Modifier_Letters"
+                  | "Modifier_Tone_Letters"
+                  | "Mongolian"
+                  | "Mongolian_Sup"
+                  | "Mro"
+                  | "Multani"
+                  | "Music"
+                  | "Myanmar"
+                  | "Myanmar_Ext_A"
+                  | "Myanmar_Ext_B"
+                  | "Myanmar_Ext_C"
+                  | "Nabataean"
+                  | "Nag_Mundari"
+                  | "Nandinagari"
+                  | "NB"
+                  | "New_Tai_Lue"
+                  | "Newa"
+                  | "NKo"
+                  | "Number_Forms"
+                  | "Nushu"
+                  | "Nyiakeng_Puachue_Hmong"
+                  | "OCR"
+                  | "Ogham"
+                  | "Ol_Chiki"
+                  | "Ol_Onal"
+                  | "Old_Hungarian"
+                  | "Old_Italic"
+                  | "Old_North_Arabian"
+                  | "Old_Permic"
+                  | "Old_Persian"
+                  | "Old_Sogdian"
+                  | "Old_South_Arabian"
+                  | "Old_Turkic"
+                  | "Old_Uyghur"
+                  | "Oriya"
+                  | "Ornamental_Dingbats"
+                  | "Osage"
+                  | "Osmanya"
+                  | "Ottoman_Siyaq_Numbers"
+                  | "Pahawh_Hmong"
+                  | "Palmyrene"
+                  | "Pau_Cin_Hau"
+                  | "Phags_Pa"
+                  | "Phaistos"
+                  | "Phoenician"
+                  | "Phonetic_Ext"
+                  | "Phonetic_Ext_Sup"
+                  | "Playing_Cards"
+                  | "Psalter_Pahlavi"
+                  | "PUA"
+                  | "Punctuation"
+                  | "Rejang"
+                  | "Rumi"
+                  | "Runic"
+                  | "Samaritan"
+                  | "Saurashtra"
+                  | "Sharada"
+                  | "Shavian"
+                  | "Shorthand_Format_Controls"
+                  | "Siddham"
+                  | "Sinhala"
+                  | "Sinhala_Archaic_Numbers"
+                  | "Small_Forms"
+                  | "Small_Kana_Ext"
+                  | "Sogdian"
+                  | "Sora_Sompeng"
+                  | "Soyombo"
+                  | "Specials"
+                  | "Sundanese"
+                  | "Sundanese_Sup"
+                  | "Sunuwar"
+                  | "Sup_Arrows_A"
+                  | "Sup_Arrows_B"
+                  | "Sup_Arrows_C"
+                  | "Sup_Math_Operators"
+                  | "Sup_PUA_A"
+                  | "Sup_PUA_B"
+                  | "Sup_Punctuation"
+                  | "Sup_Symbols_And_Pictographs"
+                  | "Super_And_Sub"
+                  | "Sutton_SignWriting"
+                  | "Syloti_Nagri"
+                  | "Symbols_And_Pictographs_Ext_A"
+                  | "Symbols_For_Legacy_Computing"
+                  | "Symbols_For_Legacy_Computing_Sup"
+                  | "Syriac"
+                  | "Syriac_Sup"
+                  | "Tagalog"
+                  | "Tagbanwa"
+                  | "Tags"
+                  | "Tai_Le"
+                  | "Tai_Tham"
+                  | "Tai_Viet"
+                  | "Tai_Xuan_Jing"
+                  | "Takri"
+                  | "Tamil"
+                  | "Tamil_Sup"
+                  | "Tangsa"
+                  | "Tangut"
+                  | "Tangut_Components"
+                  | "Tangut_Sup"
+                  | "Telugu"
+                  | "Thaana"
+                  | "Thai"
+                  | "Tibetan"
+                  | "Tifinagh"
+                  | "Tirhuta"
+                  | "Todhri"
+                  | "Toto"
+                  | "Transport_And_Map"
+                  | "Tulu_Tigalari"
+                  | "UCAS"
+                  | "UCAS_Ext"
+                  | "UCAS_Ext_A"
+                  | "Ugaritic"
+                  | "Vai"
+                  | "Vedic_Ext"
+                  | "Vertical_Forms"
+                  | "Vithkuqi"
+                  | "VS"
+                  | "VS_Sup"
+                  | "Wancho"
+                  | "Warang_Citi"
+                  | "Yezidi"
+                  | "Yi_Radicals"
+                  | "Yi_Syllables"
+                  | "Yijing"
+                  | "Zanabazar_Square"
+                  | "Znamenny_Music"
+                  }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2185">4.4.5 General Category</a>
+         </h4>
+         <p>The general category is represented by the <tt>gc</tt> attribute.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2192">[gc attribute,
+        16]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute gc { "Cc" | "Cf" | "Cn" | "Co" | "Cs"
+                 | "Ll" | "Lm" | "Lo" | "Lt" | "Lu"
+                 | "Mc" | "Me" | "Mn"
+                 | "Nd" | "Nl" | "No"
+                 | "Pc" | "Pd" | "Pe" | "Pf" | "Pi" | "Po" | "Ps"
+                 | "Sc" | "Sk" | "Sm" | "So"
+                 | "Zl" | "Zp" | "Zs"
+                 }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2201">4.4.6 Combining properties</a>
+         </h4>
+         <p>The combining class is represented by the <tt>ccc</tt> attribute, which holds the decimal
+                    representation of the combining class.
+                </p>
+         <p>Because the set of values that this property has taken across the various versions of the UCD
+                    is rather large, our schema does not restrict the possible values to those actually used.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2211">[ccc attribute,
+        17]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute ccc { xsd:integer { minInclusive="0" maxInclusive="254" } }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2219">4.4.7 Bidirectionality properties</a>
+         </h4>
+         <p>The bidirectional class is represented by the <tt>bc</tt> attribute.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2226">[bc attribute,
+        18]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute bc { "AL" | "AN"
+                 | "B" | "BN"
+                 | "CS"
+                 | "EN" | "ES" | "ET"
+                 | "FSI"
+                 | "L" | "LRE" | "LRI" | "LRO"
+                 | "NSM"
+                 | "ON"
+                 | "PDF" | "PDI"
+                 | "R" | "RLE" | "RLI" | "RLO"
+                 | "S"
+                 | "WS"
+                 }?
+</tt>
+         </p>
+         <p>The mirrored property is represented by the <tt>Bidi_M</tt> attribute, which takes a
+                    boolean value.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2234">[Bidi_M attribute,
+        19]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute Bidi_M { boolean }?
+</tt>
+         </p>
+         <p>The <tt>bmg</tt> attribute is the code point of a character whose glyph is typically
+                    a mirrored image of the glyph for the current character.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2243">[bmg attribute,
+        20]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute bmg { "" | single-code-point }?
+</tt>
+         </p>
+         <p>Note that we do not express the “Best Fit” element recorded in BidiMirroring.txt.
+                    For one thing, it is not meant to be machine readable. More importantly, the idea underlying the
+                    mirrored glyph is delicate to use, since it makes assumptions about the design of the fonts, and
+                    the best fit goes even farther.
+                </p>
+         <p>The Bidi_Control property is represented by the <tt>Bidi_C</tt> attribute.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2255">[Bidi_C attribute,
+        21]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute Bidi_C { boolean }?
+</tt>
+         </p>
+         <p>The bidi paired bracket type and bidi paired bracket properties are represented by the
+                    <tt>bpt</tt> and <tt>bpb</tt> attributes respectively.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2266">[bpt attribute,
+        22]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute bpt { "o" | "c" | "n" }?
+</tt>
+         </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2269">[bpb attribute,
+        23]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute bpb { "#" | single-code-point }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2277">4.4.8 Decomposition properties</a>
+         </h4>
+         <p>The decomposition type and decomposition mapping properties are represented by the <tt>dt</tt>
+                    and <tt>dm</tt> attributes.
+                </p>
+         <p>Most characters have a decomposition mapping to themselves. This is very similar to the
+                    situation we encountered with names, and we adopted a similar convention: if the value of a
+                    decomposition mapping is the character itself, we use the attribute value # (U+0023 #
+                    NUMBER SIGN) as a shorthand notation; this enables those attributes to be captured in groups.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2288">[decomposition properties,
+        24]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute dt { "can" | "com" | "enc" | "fin" | "font" | "fra"
+                 | "init" | "iso" | "med" | "nar" | "nb" | "sml"
+                 | "sqr" | "sub" | "sup" | "vert" | "wide" | "none"
+                 }?
+
+  code-point-attributes &amp;=
+    attribute dm { "#" | zero-or-more-code-points }?
+</tt>
+         </p>
+         <p>The properties Composition_Exclusion and Full_Composition_Exclusion are
+                    represented by the attributes <tt>CE</tt> and <tt>Comp_Ex</tt>:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2303">[composition properties,
+        25]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute CE { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Comp_Ex { boolean }?
+</tt>
+         </p>
+         <p>The properties NFC_Quick_Check, NFD_Quick_Check,
+                    NFKC_Quick_Check, NFKD_Quick_Check, Expands_On_NFC,
+                    Expands_On_NFD, Expands_On_NFKC, Expands_On_NFKD, and
+                    FC_NFKC_Closure have corresponding attributes.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2328">[quick check properties,
+        26]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute NFC_QC { "Y" | "N" | "M" }?
+
+  code-point-attributes &amp;=
+    attribute NFD_QC { "Y" | "N" }?
+
+  code-point-attributes &amp;=
+    attribute NFKC_QC { "Y" | "N" | "M" }?
+
+  code-point-attributes &amp;=
+    attribute NFKD_QC { "Y" | "N" }?
+
+
+  code-point-attributes &amp;=
+    attribute XO_NFC { boolean }?
+
+  code-point-attributes &amp;=
+    attribute XO_NFD { boolean }?
+
+  code-point-attributes &amp;=
+    attribute XO_NFKC { boolean }?
+
+  code-point-attributes &amp;=
+    attribute XO_NFKD { boolean }?
+
+
+  code-point-attributes &amp;=
+    attribute FC_NFKC { "#" | one-or-more-code-points }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2337">4.4.9 Numeric Properties</a>
+         </h4>
+         <p>The numeric type is represented by the <tt>nt</tt> attribute.
+                </p>
+         <p>The numeric value is represented by the <tt>nv</tt> attribute, expressed as a whole
+                    number or a fraction.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2349">[numeric properties,
+        27]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute nt { "De" | "Di" | "Nu" | "None" }?
+
+  code-point-attributes &amp;=
+    attribute nv { "NaN" | xsd:string { pattern="-?[0-9]+(/[0-9]+)?" } }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2357">4.4.10 Joining properties</a>
+         </h4>
+         <p>The joining type of a character is represented by the <tt>jt</tt> attribute.
+                </p>
+         <p>The <tt>jg</tt> attribute is the joining group of the character.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2369">[joining properties,
+        28]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute jt { "C" | "D" | "L" | "R" | "T" | "U" }?
+
+  code-point-attributes &amp;=
+    attribute jg { "African_Feh" | "African_Noon" | "African_Qaf"
+                 | "Ain" | "Alaph" | "Alef"
+                 | "Beh" | "Beth" | "Burushaski_Yeh_Barree"
+                 | "Dal" | "Dalath_Rish"
+                 | "E"
+                 | "Farsi_Yeh" | "Fe" | "Feh" | "Final_Semkath"
+                 | "Gaf" | "Gamal"
+                 | "Hah" | "Hanifi_Rohingya_Kinna_Ya"
+                 | "Hanifi_Rohingya_Pa" | "He" | "Heh" | "Heh_Goal"
+                 | "Heth"
+                 | "Kaf" | "Kaph" | "Kashmiri_Yeh" | "Khaph"
+                 | "Knotted_Heh"
+                 | "Lam" | "Lamadh"
+                 | "Malayalam_Bha" | "Malayalam_Ja" | "Malayalam_Lla"
+                 | "Malayalam_Llla" | "Malayalam_Nga"
+                 | "Malayalam_Nna" | "Malayalam_Nnna"
+                 | "Malayalam_Nya" | "Malayalam_Ra" | "Malayalam_Ssa"
+                 | "Malayalam_Tta" | "Manichaean_Aleph"
+                 | "Manichaean_Ayin" | "Manichaean_Beth"
+                 | "Manichaean_Daleth" | "Manichaean_Dhamedh"
+                 | "Manichaean_Five" | "Manichaean_Gimel"
+                 | "Manichaean_Heth" | "Manichaean_Hundred"
+                 | "Manichaean_Kaph" | "Manichaean_Lamedh"
+                 | "Manichaean_Mem" | "Manichaean_Nun"
+                 | "Manichaean_One" | "Manichaean_Pe"
+                 | "Manichaean_Qoph" | "Manichaean_Resh"
+                 | "Manichaean_Sadhe" | "Manichaean_Samekh"
+                 | "Manichaean_Taw" | "Manichaean_Ten"
+                 | "Manichaean_Teth" | "Manichaean_Thamedh"
+                 | "Manichaean_Twenty" | "Manichaean_Waw"
+                 | "Manichaean_Yodh" | "Manichaean_Zayin" | "Meem"
+                 | "Mim"
+                 | "No_Joining_Group" | "Noon" | "Nun" | "Nya"
+                 | "Pe"
+                 | "Qaf" | "Qaph"
+                 | "Reh" | "Reversed_Pe" | "Rohingya_Yeh"
+                 | "Sad" | "Sadhe" | "Seen" | "Semkath" | "Shin"
+                 | "Straight_Waw" | "Swash_Kaf" | "Syriac_Waw"
+                 | "Tah" | "Taw" | "Teh_Marbuta" | "Teh_Marbuta_Goal"
+                 | "Teth" | "Thin_Yeh"
+                 | "Vertical_Tail"
+                 | "Waw"
+                 | "Yeh" | "Yeh_Barree" | "Yeh_With_Tail" | "Yudh"
+                 | "Yudh_He"
+                 | "Zain" | "Zhain"
+                 }?
+</tt>
+         </p>
+         <p>The Join_Control property is represented by the <tt>Join_C</tt> attribute.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2380">[joining properties,
+        29]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute Join_C { boolean }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2388">4.4.11 Linebreak properties</a>
+         </h4>
+         <p>The Line_Break property is represented by the <tt>lb</tt> attribute.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2397">[lb attribute,
+        30]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute lb { "AI" | "AK" | "AL" | "AP" | "AS"
+                 | "B2" | "BA" | "BB" | "BK"
+                 | "CB" | "CJ" | "CL" | "CM" | "CP" | "CR"
+                 | "EB" | "EM" | "EX"
+                 | "GL"
+                 | "H2" | "H3" | "HL" | "HY"
+                 | "ID" | "IN" | "IS"
+                 | "JL" | "JT" | "JV"
+                 | "LF"
+                 | "NL" | "NS" | "NU"
+                 | "OP"
+                 | "PO" | "PR"
+                 | "QU"
+                 | "RI"
+                 | "SA" | "SG" | "SP" | "SY"
+                 | "VF" | "VI"
+                 | "WJ"
+                 | "XX"
+                 | "ZW" | "ZWJ"
+                 }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2406">4.4.12 East Asian Width property</a>
+         </h4>
+         <p>The East Asian width property is represented by the <tt>ea</tt> attribute.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2413">[ea attribute,
+        31]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute ea { "A" | "F" | "H" | "N" | "Na" | "W" }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2421">4.4.13 Case properties</a>
+         </h4>
+         <p>The Uppercase, Lowercase, Other_Uppercase and
+                    Other_Lowercase properties are represented by corresponding attributes.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2434">[casing properties,
+        32]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute Upper { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Lower { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OUpper { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OLower { boolean }?
+</tt>
+         </p>
+         <p>Most characters have a case mapping and case folding properties that simply map or fold to
+                    themselves. This is very similar to the situation we encountered with names, and we adopted a
+                    similar convention: if the value of a case mapping or case folding property is the character
+                    itself, we use the attribute value # (U+0023 # NUMBER SIGN) as a shorthand notation; this
+                    enables those attributes to be captured in groups.
+                </p>
+         <p>The simple case mappings are recorded in the <tt>suc</tt>, <tt>slc</tt>, <tt>stc</tt>
+                    attributes.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2449">[casing properties,
+        33]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute suc { "#" | single-code-point }?
+
+  code-point-attributes &amp;=
+    attribute slc { "#" | single-code-point }?
+
+  code-point-attributes &amp;=
+    attribute stc { "#" | single-code-point }?
+</tt>
+         </p>
+         <p>The non-simple case mappings are recorded in the <tt>uc</tt>, <tt>lc</tt> and <tt>tc</tt>
+                    attributes.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2461">[casing properties,
+        34]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute uc { "#" | one-or-more-code-points }?
+
+  code-point-attributes &amp;=
+    attribute lc { "#" | one-or-more-code-points }?
+
+  code-point-attributes &amp;=
+    attribute tc { "#" | one-or-more-code-points }?
+</tt>
+         </p>
+         <p>The Simple_Case_Folding and Case_Folding properties are recorded in the
+                    <tt>scf</tt> and <tt>cf</tt> attributes respectively.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2475">[casing properties,
+        35]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute scf { "#" | single-code-point }?
+
+  code-point-attributes &amp;=
+    attribute cf { "#" | one-or-more-code-points }?
+</tt>
+         </p>
+         <p>The Case_Ignorable, Cased, Changes_When_Casefolded,
+                    Changes_When_Casemapped, Changes_When_Lowercased,
+                    Changes_When_NFKC_Casefolded, Changes_When_Titlecased,
+                    Changes_When_Uppercased, NFKC_Casefold, and
+                    NFKC_Simple_Casefold properties are recorded in these attributes:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2503">[casing properties,
+        36]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute CI { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Cased { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWCF { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWCM { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWL { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWKCF { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWT { boolean }?
+
+  code-point-attributes &amp;=
+    attribute CWU { boolean }?
+
+  code-point-attributes &amp;=
+    attribute NFKC_CF { "#" | zero-or-more-code-points }?
+
+  code-point-attributes &amp;=
+    attribute NFKC_SCF { "#" | zero-or-more-code-points }?
+</tt>
+         </p>
+         <p>Note that the UCD records more information about case folding than is expressed in the
+                    properties, specifically the entries in CaseFolding.txt with status T.
+                </p>
+         <h4>
+            <a name="d1e2513">4.4.14 Script properties</a>
+         </h4>
+         <p>The script and script extension properties are represented by the <tt>sc</tt> and
+                    <tt>scx</tt> attributes respectively.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2522">[script properties,
+        37]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  script = "Adlm" | "Aghb" | "Ahom" | "Arab" | "Armi" | "Armn"
+           | "Avst"
+           | "Bali" | "Bamu" | "Bass" | "Batk" | "Beng" | "Bhks"
+           | "Bopo" | "Brah" | "Brai" | "Bugi" | "Buhd"
+           | "Cakm" | "Cans" | "Cari" | "Cham" | "Cher" | "Chrs"
+           | "Copt" | "Cpmn" | "Cprt" | "Cyrl"
+           | "Deva" | "Diak" | "Dogr" | "Dsrt" | "Dupl"
+           | "Egyp" | "Elba" | "Elym" | "Ethi"
+           | "Gara" | "Geor" | "Glag" | "Gong" | "Gonm" | "Goth"
+           | "Gran" | "Grek" | "Gujr" | "Gukh" | "Guru"
+           | "Hang" | "Hani" | "Hano" | "Hatr" | "Hebr" | "Hira"
+           | "Hluw" | "Hmng" | "Hmnp" | "Hrkt" | "Hung"
+           | "Ital"
+           | "Java"
+           | "Kali" | "Kana" | "Kawi" | "Khar" | "Khmr" | "Khoj"
+           | "Kits" | "Knda" | "Krai" | "Kthi"
+           | "Lana" | "Laoo" | "Latn" | "Lepc" | "Limb" | "Lina"
+           | "Linb" | "Lisu" | "Lyci" | "Lydi"
+           | "Mahj" | "Maka" | "Mand" | "Mani" | "Marc" | "Medf"
+           | "Mend" | "Merc" | "Mero" | "Mlym" | "Modi" | "Mong"
+           | "Mroo" | "Mtei" | "Mult" | "Mymr"
+           | "Nagm" | "Nand" | "Narb" | "Nbat" | "Newa" | "Nkoo"
+           | "Nshu"
+           | "Ogam" | "Olck" | "Onao" | "Orkh" | "Orya" | "Osge"
+           | "Osma" | "Ougr"
+           | "Palm" | "Pauc" | "Perm" | "Phag" | "Phli" | "Phlp"
+           | "Phnx" | "Plrd" | "Prti"
+           | "Rjng" | "Rohg" | "Runr"
+           | "Samr" | "Sarb" | "Saur" | "Sgnw" | "Shaw" | "Shrd"
+           | "Sidd" | "Sind" | "Sinh" | "Sogd" | "Sogo" | "Sora"
+           | "Soyo" | "Sund" | "Sunu" | "Sylo" | "Syrc"
+           | "Tagb" | "Takr" | "Tale" | "Talu" | "Taml" | "Tang"
+           | "Tavt" | "Telu" | "Tfng" | "Tglg" | "Thaa" | "Thai"
+           | "Tibt" | "Tirh" | "Tnsa" | "Todr" | "Toto" | "Tutg"
+           | "Ugar"
+           | "Vaii" | "Vith"
+           | "Wara" | "Wcho"
+           | "Xpeo" | "Xsux"
+           | "Yezi" | "Yiii"
+           | "Zanb" | "Zinh" | "Zyyy" | "Zzzz"
+
+  code-point-attributes &amp;=
+    attribute sc { script }?
+
+  code-point-attributes &amp;=
+    attribute scx { list { script + } }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2531">4.4.15 ISO Comment properties</a>
+         </h4>
+         <p>The ISO 10646 comment field is represented by the <tt>isc</tt> attribute.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2538">[isc attribute,
+        38]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute isc { text }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2546">4.4.16 Hangul properties</a>
+         </h4>
+         <p>The property Hangul_Syllable_Type is represented by the <tt>hst</tt> attribute.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2555">[hst attribute,
+        39]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute hst { "L" | "LV" | "LVT" | "NA" | "T" | "V" }?
+</tt>
+         </p>
+         <p>The property Jamo_Short_Name is represented by the <tt>JSN</tt> attribute:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2565">[JSN attribute,
+        40]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute JSN { xsd:string { pattern="[A-Z]{0,3}" } }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2573">4.4.17 Indic properties</a>
+         </h4>
+         <p>The property Indic_Syllabic_Category is represented by the <tt>InSC</tt>
+                    attribute.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2582">[InSC attribute,
+        41]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute InSC { "Avagraha"
+                   | "Bindu"
+                   | "Brahmi_Joining_Number"
+                   | "Cantillation_Mark"
+                   | "Consonant"
+                   | "Consonant_Dead"
+                   | "Consonant_Final"
+                   | "Consonant_Head_Letter"
+                   | "Consonant_Initial_Postfixed"
+                   | "Consonant_Killer"
+                   | "Consonant_Medial"
+                   | "Consonant_Placeholder"
+                   | "Consonant_Preceding_Repha"
+                   | "Consonant_Prefixed"
+                   | "Consonant_Subjoined"
+                   | "Consonant_Succeeding_Repha"
+                   | "Consonant_With_Stacker"
+                   | "Gemination_Mark"
+                   | "Invisible_Stacker"
+                   | "Joiner"
+                   | "Modifying_Letter"
+                   | "Non_Joiner"
+                   | "Nukta"
+                   | "Number"
+                   | "Number_Joiner"
+                   | "Other"
+                   | "Pure_Killer"
+                   | "Register_Shifter"
+                   | "Reordering_Killer"
+                   | "Syllable_Modifier"
+                   | "Tone_Letter"
+                   | "Tone_Mark"
+                   | "Virama"
+                   | "Visarga"
+                   | "Vowel"
+                   | "Vowel_Dependent"
+                   | "Vowel_Independent"
+                   }?
+</tt>
+         </p>
+         <p>The property Indic_Positional_Category is represented by the <tt>InPC</tt>
+                    attribute:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2592">[InPC attribute,
+        42]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute InPC { "Bottom"
+                   | "Bottom_And_Left"
+                   | "Bottom_And_Right"
+                   | "Left"
+                   | "Left_And_Right"
+                   | "NA"
+                   | "Overstruck"
+                   | "Right"
+                   | "Top"
+                   | "Top_And_Bottom"
+                   | "Top_And_Bottom_And_Left"
+                   | "Top_And_Bottom_And_Right"
+                   | "Top_And_Left"
+                   | "Top_And_Left_And_Right"
+                   | "Top_And_Right"
+                   | "Visual_Order_Left"
+                   }?
+</tt>
+         </p>
+         <p>The property Indic_Conjunct_Break is represented by the <tt>InCB</tt> attribute:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2603">[InCB attribute,
+        43]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute InCB { "Consonant"
+                   | "Extend"
+                   | "Linker"
+                   | "None"
+                   }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2612">4.4.18 Identifier and Pattern and programming language properties</a>
+         </h4>
+         <p>The properties ID_Start, Other_ID_Start, XID_Start,
+                    ID_Continue, Other_ID_Continue, XID_Continue,
+                    ID_Compat_Math_Start, and ID_Compat_Math_Continue are represented by
+                    corresponding attributes:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2634">[identifier properties,
+        44]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute IDS { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OIDS { boolean }?
+
+  code-point-attributes &amp;=
+    attribute XIDS { boolean }?
+
+  code-point-attributes &amp;=
+    attribute IDC { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OIDC { boolean }?
+
+  code-point-attributes &amp;=
+    attribute XIDC { boolean }?
+
+  code-point-attributes &amp;=
+    attribute ID_Compat_Math_Start { boolean }?
+
+  code-point-attributes &amp;=
+    attribute ID_Compat_Math_Continue { boolean }?
+</tt>
+         </p>
+         <p>The properties Pattern_Syntax and Pattern_White_Space are represented
+                    by corresponding attributes:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2644">[pattern properties,
+        45]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute Pat_Syn { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Pat_WS { boolean }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2652">4.4.19 Properties related to function and graphic characteristics</a>
+         </h4>
+         <p>The properties Dash, Hyphen, Quotation_Mark,
+                    Terminal_Punctuation, Sentence_Terminal, Diacritic,
+                    Extender, Soft_Dotted, Alphabetic,
+                    Other_Alphabetic, Math, Other_Math, Hex_Digit,
+                    ASCII_Hex_Digit, Default_Ignorable_Code_Point,
+                    Other_Default_Ignorable_Code_Point, Logical_Order_Exception,
+                    Prepended_Concatenation_Mark, Modifier_Combining_Mark,
+                    White_Space, Vertical_Orientation, and Regional_Indicator
+                    describe the function or graphic characteristic of a character, and each have a corresponding
+                    attribute.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2704">[properties related to function and graphic characteristics,
+        46]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute Dash { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Hyphen { boolean }?
+
+  code-point-attributes &amp;=
+    attribute QMark { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Term { boolean }?
+
+  code-point-attributes &amp;=
+    attribute STerm { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Dia { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Ext { boolean }?
+
+  code-point-attributes &amp;=
+    attribute SD { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Alpha { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OAlpha { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Math { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OMath { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Hex { boolean }?
+
+  code-point-attributes &amp;=
+    attribute AHex { boolean }?
+
+  code-point-attributes &amp;=
+    attribute DI { boolean }?
+
+  code-point-attributes &amp;=
+    attribute ODI { boolean }?
+
+  code-point-attributes &amp;=
+    attribute LOE { boolean }?
+
+  code-point-attributes &amp;=
+    attribute PCM { boolean }?
+
+  code-point-attributes &amp;=
+    attribute MCM { boolean }?
+
+  code-point-attributes &amp;=
+    attribute WSpace { boolean }?
+
+  code-point-attributes &amp;=
+    attribute vo { "R" | "Tr" | "Tu" | "U" }?
+
+  code-point-attributes &amp;=
+    attribute RI { boolean }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2712">4.4.20 Properties related to boundaries</a>
+         </h4>
+         <p>The properties Grapheme_Base, Grapheme_Extend,
+                    Other_Grapheme_Extend, Grapheme_Link,
+                    Grapheme_Cluster_Break, Word_Break, and Sentence_Break each
+                    have a corresponding attribute:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2732">[properties related to boundaries,
+        47]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute Gr_Base { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Gr_Ext { boolean }?
+
+  code-point-attributes &amp;=
+    attribute OGr_Ext { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Gr_Link { boolean }?
+
+  code-point-attributes &amp;=
+    attribute GCB { "CN" | "CR"
+                  | "EB" | "EBG" | "EM" | "EX"
+                  | "GAZ"
+                  | "L" | "LF" | "LV" | "LVT"
+                  | "PP"
+                  | "RI"
+                  | "SM"
+                  | "T"
+                  | "V"
+                  | "XX"
+                  | "ZWJ"
+                  }?
+
+  code-point-attributes &amp;=
+    attribute WB { "CR"
+                 | "DQ"
+                 | "EB" | "EBG" | "EM" | "EX" | "Extend"
+                 | "FO"
+                 | "GAZ"
+                 | "HL"
+                 | "KA"
+                 | "LE" | "LF"
+                 | "MB" | "ML" | "MN"
+                 | "NL" | "NU"
+                 | "RI"
+                 | "SQ"
+                 | "WSegSpace"
+                 | "XX"
+                 | "ZWJ"
+                 }?
+
+  code-point-attributes &amp;=
+    attribute SB { "AT"
+                 | "CL" | "CR"
+                 | "EX"
+                 | "FO"
+                 | "LE" | "LF" | "LO"
+                 | "NU"
+                 | "SC" | "SE" | "SP" | "ST"
+                 | "UP"
+                 | "XX"
+                 }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2741">4.4.21 Properties related to ideographs</a>
+         </h4>
+         <p>The properties Ideographic, Unified_Ideograph,
+                    Equivalent_Unified_Ideograph, IDS_Binary_Operator,
+                    IDS_Trinary_Operator, IDS_Unary_Operator, and Radical have
+                    corresponding attributes:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2761">[properties related to ideographs,
+        48]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute Ideo { boolean }?
+
+  code-point-attributes &amp;=
+    attribute UIdeo { boolean }?
+
+  code-point-attributes &amp;=
+    attribute EqUIdeo { single-code-point }?
+
+  code-point-attributes &amp;=
+    attribute IDSB { boolean }?
+
+  code-point-attributes &amp;=
+    attribute IDST { boolean }?
+
+  code-point-attributes &amp;=
+    attribute IDSU { boolean }?
+
+  code-point-attributes &amp;=
+    attribute Radical { boolean }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2769">4.4.22 Miscellaneous properties</a>
+         </h4>
+         <p>The properties Deprecated, Variation_Selector, and
+                    Noncharacter_Code_Point have corresponding attributes:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2780">[miscellaneous properties,
+        49]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute Dep { boolean }?
+
+  code-point-attributes &amp;=
+    attribute VS { boolean }?
+
+  code-point-attributes &amp;=
+    attribute NChar { boolean }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2788">4.4.23 Unihan properties</a>
+         </h4>
+         <p>The Unihan properties (from the Unihan database) are represented as attributes.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2792">[Unihan properties,
+        50]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;= attribute kAccountingNumeric
+    { xsd:string { pattern="[0-9]+" } }?
+
+  code-point-attributes &amp;= attribute kAlternateTotalStrokes
+    { list { xsd:string { pattern="(\d+:[BHJKMPSUV]+)|-" }+ } }?
+
+  code-point-attributes &amp;= attribute kBigFive
+    { xsd:string { pattern="[0-9A-F]{4}'?" } }?
+
+  code-point-attributes &amp;= attribute kCangjie
+    { xsd:string { pattern="[A-Z]+" } }?
+
+  code-point-attributes &amp;= attribute kCantonese
+    { list { xsd:string { pattern="[a-z]{1,6}[1-6]" }+ } }?
+
+  code-point-attributes &amp;= attribute kCCCII
+    { list { xsd:string { pattern="[0-9A-F]{6}" }+ } }?
+
+  code-point-attributes &amp;= attribute kCheungBauer
+    { list { xsd:string { pattern="[0-9]{3}/[0-9]{2};[A-Z]*;[a-z1-6\[\]/,]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kCheungBauerIndex
+    { list { xsd:string { pattern="[0-9]{3}\.[01][0-9]" }+ } }?
+
+  code-point-attributes &amp;= attribute kCihaiT
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}\.[0-9]{3}" }+ } }?
+
+  code-point-attributes &amp;= attribute kCNS1986
+    { xsd:string { pattern="[12E]-[0-9A-F]{4}" } }?
+
+  code-point-attributes &amp;= attribute kCNS1992
+    { xsd:string { pattern="[1-9]-[0-9A-F]{4}" } }?
+
+  code-point-attributes &amp;= attribute kCompatibilityVariant
+    { "" | xsd:string { pattern="U\+[23]?[0-9A-F]{4}" } }?
+
+  code-point-attributes &amp;= attribute kCowles
+    { list { xsd:string { pattern="[0-9]{1,4}(\.[0-9]{1,2})?" }+ } }?
+
+  code-point-attributes &amp;= attribute kDaeJaweon
+    { xsd:string { pattern="[0-9]{4}\.[0-9]{2}[01]" } }?
+
+  code-point-attributes &amp;= attribute kDefinition
+    { xsd:string { pattern='[^\t"]+' } }?
+
+  code-point-attributes &amp;= attribute kEACC
+    { xsd:string { pattern="[0-9A-F]{6}" } }?
+
+  code-point-attributes &amp;= attribute kFanqie
+    { list { xsd:string { pattern="[\x{3400}-\x{4DBF}\x{4E00}-\x{9FFF}\x{20000}-\x{2A6DF}]{2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kFenn
+    { list { xsd:string { pattern="[0-9]+a?[A-KP*]" }+ } }?
+
+  code-point-attributes &amp;= attribute kFennIndex
+    { list { xsd:string { pattern="[0-9][0-9]{0,2}\.[01][0-9]" }+ } }?
+
+  code-point-attributes &amp;= attribute kFourCornerCode
+    { list { xsd:string { pattern="[0-9]{4}(\.[0-9])?" }+ } }?
+
+  code-point-attributes &amp;= attribute kGB0
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGB1
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGB3
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGB5
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGB7
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGB8
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kGradeLevel
+    { xsd:string { pattern="[1-6]" } }?
+
+  code-point-attributes &amp;= attribute kGSR
+    { list { xsd:string { pattern="[0-9]{4}[a-vx-z]'?" }+ } }?
+
+  code-point-attributes &amp;= attribute kHangul
+    { list { xsd:string { pattern="[\x{1100}-\x{1112}][\x{1161}-\x{1175}][\x{11A8}-\x{11C2}]?:[01ENX]{1,3}" }+ } }?
+
+  code-point-attributes &amp;= attribute kHanYu
+    { list { xsd:string { pattern="[1-8][0-9]{4}\.[0-3][0-9][0-3]" }+ } }?
+
+  code-point-attributes &amp;= attribute kHanyuPinlu
+    { list { xsd:string { pattern="[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+\([0-9]+\)" }+ } }?
+
+  code-point-attributes &amp;= attribute kHanyuPinyin
+    { list { xsd:string { pattern="(\d{5}\.\d{2}0,)*\d{5}\.\d{2}0:([a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+,)*[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kHDZRadBreak
+    { xsd:string { pattern="[\x{2F00}-\x{2FD5}]\[U\+2F[0-9A-D][0-9A-F]\]:[1-8][0-9]{4}\.[0-3][0-9]0" } }?
+
+  code-point-attributes &amp;= attribute kHKGlyph
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kIBMJapan
+    { list { xsd:string { pattern="F[ABC][0-9A-F]{2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kIICore
+    { list { xsd:string { pattern="[ABC][GHJKMPT]{1,7}" }+ } }?
+
+  code-point-attributes &amp;= attribute kIRG_GSource
+    { "" | xsd:string { pattern="G[013578EKS]-[0-9A-F]{4}" }
+         | xsd:string { pattern="G4K(-\d{5})?" }
+         | xsd:string { pattern="G(DZ|GH|RM|WZ|XC|XH|ZH)-\d{4}\.\d{2}" }
+         | xsd:string { pattern="G(BK|CH|CY|HC)(-\d{4}\.\d{2})?" }
+         | xsd:string { pattern="GKX-\d{4}\.\d{2,3}" }
+         | xsd:string { pattern="G(HZ|HZR)-\d{5}\.\d{2}" }
+         | xsd:string { pattern="G(CE|FC|IDC23|OCD|XHZ)-\d{3}" }
+         | xsd:string { pattern="G(H|HF|LGYJ|PGLG|T)-\d{4}" }
+         | xsd:string { pattern="G(CYY|DM|JZ|KJ|XM|ZFY|ZJW|ZYS)-\d{5}" }
+         | xsd:string { pattern="G(FZ|IDC)-[0-9A-F]{4}" }
+         | xsd:string { pattern="GGFZ-\d{6}" }
+         | xsd:string { pattern="G(LK|Z)-\d{7}" }
+         | xsd:string { pattern="GU-[023][0-9A-F]{4}" }
+         | xsd:string { pattern="GZA-[123467]\d{5}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_HSource
+    { "" | xsd:string { pattern="H-[0-9A-F]{4}" }
+         | xsd:string { pattern="H(B[012])-[0-9A-F]{4}" }
+         | xsd:string { pattern="HD-[23]?[0-9A-F]{4}" }
+         | xsd:string { pattern="HU-[023][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_JSource
+    { "" | xsd:string { pattern="J[014]-[0-9A-F]{4}" }
+         | xsd:string { pattern="J3A?-[0-9A-F]{4}" }
+         | xsd:string { pattern="J13A?-[0-9A-F]{4}" }
+         | xsd:string { pattern="J14-[0-9A-F]{4}" }
+         | xsd:string { pattern="JA[34]?-[0-9A-F]{4}" }
+         | xsd:string { pattern="JARIB-[0-9A-F]{4}" }
+         | xsd:string { pattern="JH-(JT[ABC][0-9A-F]{3}S?|IB\d{4}|\d{6})" }
+         | xsd:string { pattern="JK-\d{5}" }
+         | xsd:string { pattern="JMJ-\d{6}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_KPSource
+    { "" | xsd:string { pattern="KP([01]-[0-9A-F]{4}|U-[023][0-9A-F]{4})" } }?
+
+  code-point-attributes &amp;= attribute kIRG_KSource
+    { "" | xsd:string { pattern="K[0-6]-[0-9A-F]{4}" }
+         | xsd:string { pattern="KC-\d{5}" }
+         | xsd:string { pattern="KU-[023][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_MSource
+    { "" | xsd:string { pattern="MA-[0-9A-F]{4}" }
+         | xsd:string { pattern="MB[12]-[0-9A-F]{4}" }
+         | xsd:string { pattern="MC-\d{5}" }
+         | xsd:string { pattern="MDH?-[23]?[0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_SSource
+    { "" | xsd:string { pattern="SAT-\d{5}" } }?
+
+  code-point-attributes &amp;= attribute kIRG_TSource
+    { "" | xsd:string { pattern="T([1-7A-F]|1[1-3])-[0-9A-F]{4}" }
+         | xsd:string { pattern="TU-[023][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRG_UKSource
+    { "" | xsd:string { pattern="UK-\d{5}" } }?
+
+  code-point-attributes &amp;= attribute kIRG_USource
+    { "" | xsd:string { pattern="UTC-\d{5}" } }?
+
+  code-point-attributes &amp;= attribute kIRG_VSource
+    { "" | xsd:string { pattern="V[0-4]-[0-9A-F]{4}" }
+         | xsd:string { pattern="VN-[023F][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &amp;= attribute kIRGDaeJaweon
+    { list { xsd:string { pattern="[0-9]{4}\.[0-9]{2}[01]" }+ } }?
+
+  code-point-attributes &amp;= attribute kIRGHanyuDaZidian
+    { list { xsd:string { pattern="[1-8][0-9]{4}\.[0-3][0-9][01]" }+ } }?
+
+  code-point-attributes &amp;= attribute kIRGKangXi
+    { list { xsd:string { pattern="[01][0-9]{3}\.[0-7][0-9][01]" }+ } }?
+
+  code-point-attributes &amp;= attribute kJa
+    { list { xsd:string { pattern="[0-9A-F]{4}S?" }+ } }?
+
+  code-point-attributes &amp;= attribute kJapanese
+    { list { xsd:string { pattern="[\x{3041}-\x{3096}\x{3099}\x{309A}\x{30A1}-\x{30FA}\x{30FC}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kJapaneseKun
+    { list { xsd:string { pattern="[A-Z]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kJapaneseOn
+    { list { xsd:string { pattern="[A-Z]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kJinmeiyoKanji
+    { list { xsd:string { pattern="(20[0-9]{2})(:U\+[23]?[0-9A-F]{4})?" }+ } }?
+
+  code-point-attributes &amp;= attribute kJis0
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kJis1
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kJIS0213
+    { list { xsd:string { pattern="[12],[0-9]{2},[0-9]{1,2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kJoyoKanji
+    { list { xsd:string { pattern="(20[0-9]{2})|(U\+[23]?[0-9A-F]{4})" }+ } }?
+
+  code-point-attributes &amp;= attribute kKangXi
+    { list { xsd:string { pattern="[0-9]{4}\.[0-9]{2}[01]" }+ } }?
+
+  code-point-attributes &amp;= attribute kKarlgren
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}[A*]?" }+ } }?
+
+  code-point-attributes &amp;= attribute kKorean
+    { list { xsd:string { pattern="[A-Z]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kKoreanEducationHanja
+    { list { xsd:string { pattern="20[0-9]{2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kKoreanName
+    { list { xsd:string { pattern="20[0-9]{2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kLau
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}" }+ } }?
+
+  code-point-attributes &amp;= attribute kMainlandTelegraph
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kMandarin
+    { list { xsd:string { pattern="[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kMatthews
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}(a|\.5)?" }+ } }?
+
+  code-point-attributes &amp;= attribute kMeyerWempe
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}[a-t*]?" }+ } }?
+
+  code-point-attributes &amp;= attribute kMojiJoho
+    { list { xsd:string { pattern="MJ\d{6}(:(FE0[01]|E01[01][0-9A-F]))?" }+ } }?
+
+  code-point-attributes &amp;= attribute kMorohashi
+    { list { xsd:string { pattern="(\d{5}'{0,2}|H\d{3})(:(FE0[01]|E010[0-9A-F]))?" }+ } }?
+
+  code-point-attributes &amp;= attribute kNelson
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kOtherNumeric
+    { list { xsd:string { pattern="[0-9]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kPhonetic
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}[A-D]?\*?" }+ } }?
+
+  code-point-attributes &amp;= attribute kPrimaryNumeric
+    { list { xsd:string { pattern="[0-9]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kPseudoGB1
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &amp;= attribute kRSAdobe_Japan1_6
+    { list { xsd:string { pattern="[CV]\+[0-9]{1,5}\+[1-9][0-9]{0,2}\.[1-9][0-9]?\.[0-9]{1,2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kRSUnicode
+    { list { xsd:string { pattern="[1-9][0-9]{0,2}'{0,3}\.-?[0-9]{1,2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kSBGY
+    { list { xsd:string { pattern="[0-9]{3}\.[0-7][0-9]" }+ } }?
+
+  code-point-attributes &amp;= attribute kSemanticVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}(&lt;[ks][A-Za-z0-9_]+(:[TBZFJ]+)?(,[ks][A-Za-z0-9_]+(:[TBZFJ]+)?)*)?" }+ } }?
+
+  code-point-attributes &amp;= attribute kSimplifiedVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kSMSZD2003Index
+    { list { xsd:string { pattern="\d{1,3}\.\d{2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kSMSZD2003Readings
+    { list { xsd:string { pattern="[a-z\x{300}\x{301}\x{302}\x{304}\x{308}\x{30C}]+(,[a-z\x{300}\x{301}\x{302}\x{304}\x{308}\x{30C}]+)*\x{7CB5}[a-z]+[1-6]([a-z]+[1-6])?(,[a-z]+[1-6]([a-z]+[1-6])?)*" }+ } }?
+
+  code-point-attributes &amp;= attribute kSpecializedSemanticVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}(&lt;[ks][A-Za-z0-9_]+(:[TBZFJ]+)?(,[ks][A-Za-z0-9_]+(:[TBZFJ]+)?)*)?" }+ } }?
+
+  code-point-attributes &amp;= attribute kSpoofingVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kStrange
+    { list { ( xsd:string { pattern="[ACU]" }
+             | xsd:string { pattern="B:U\+31[0-2AB][0-9A-F]" }
+             | xsd:string { pattern="[FMOR](:U\+[23]?[0-9A-F]{4})?" }
+             | xsd:string { pattern="H:U\+31[3-8][0-9A-F]" }
+             | xsd:string { pattern="I(:U\+[23]?[0-9A-F]{4})*" }
+             | xsd:string { pattern="K(:U\+30[A-F][0-9A-F])+" }
+             | xsd:string { pattern="S:[4-9][0-9]" }
+    )+}}?
+
+  code-point-attributes &amp;= attribute kTaiwanTelegraph
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kTang
+    { list { xsd:string { pattern="\*?[A-Za-z()\x{E6}\x{251}\x{259}\x{25B}\x{300}\x{30C}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kTGH
+    { list { xsd:string { pattern="20[0-9]{2}:[1-9][0-9]{0,3}" }+ } }?
+
+  code-point-attributes &amp;= attribute kTGHZ2013
+    { list { xsd:string { pattern="[0-9]{3}\.[0-9]{3}(,[0-9]{3}\.[0-9]{3})*:[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kTotalStrokes
+    { list { xsd:string { pattern="[1-9][0-9]{0,2}" }+ } }?
+
+  code-point-attributes &amp;= attribute kTraditionalVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}" }+ } }?
+
+  code-point-attributes &amp;= attribute kUnihanCore2020
+    { xsd:string { pattern="[GHJKMPT]{1,7}" } }?
+
+  code-point-attributes &amp;= attribute kVietnamese
+    { list { xsd:string { pattern="[A-Za-z\x{110}\x{111}\x{300}-\x{303}\x{306}\x{309}\x{31B}\x{323}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kVietnameseNumeric
+    { list { xsd:string { pattern="\d+" }+ } }?
+
+  code-point-attributes &amp;= attribute kXerox
+    { list { xsd:string { pattern="[0-9]{3}:[0-9]{3}" }+ } }?
+
+  code-point-attributes &amp;= attribute kXHC1983
+    { list { xsd:string { pattern="[0-9]{4}\.[0-9]{3}\*?(,[0-9]{4}\.[0-9]{3}\*?)*:[a-z\x{300}\x{301}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &amp;= attribute kZhuang
+    { list { xsd:string { pattern="[a-z]+\*?" }+ } }?
+
+  code-point-attributes &amp;= attribute kZhuangNumeric
+    { list { xsd:string { pattern="\d+" }+ } }?
+
+  code-point-attributes &amp;= attribute kZVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}(&lt;[ks][A-Za-z0-9_]+(:[TBZ]+)?(,[ks][A-Za-z0-9_]+(:[TBZ]+)?)*)?" }+ } }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2801">4.4.24 Tangut data</a>
+         </h4>
+         <p>The Tangut data are represented as attributes. The attribute <tt>kRSTUnicode</tt>
+                    represents the radical stroke index. The attribute <tt>kTGT_MergedSrc</tt> indicates the
+                    source reference for the character.
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2810">[Tangut data,
+        51]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute kRSTUnicode { xsd:string { pattern="[0-9]+\.[0-9]+" } }?
+
+  code-point-attributes &amp;=
+    attribute kTGT_MergedSrc 
+     { xsd:string {pattern="L2008-[0-9A-F]{4,5}(-[0-9]{4,5})?"}
+     | xsd:string {pattern="L2006-[0-9]{4}"}
+     | xsd:string {pattern="L1997-[0-9]{4}"}
+     | xsd:string {pattern="L1986-[0-9]{4}"}
+     | xsd:string {pattern="S1968-[0-9]{4}"}
+     | xsd:string {pattern="N1966-[0-9]{3}(-[0-9A-Z]{3,4})?"}
+     | xsd:string {pattern="H2004-[A-Z]-[0-9]{4}"}
+     | xsd:string {pattern="L2012-[0-9]{4}"}
+     | xsd:string {pattern="UTN42-[0-9]{3}"}
+     }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2818">4.4.25 Nushu data</a>
+         </h4>
+         <p>The Nushu data are represented as attributes. The attribute <tt>kSrc_NushuDuben</tt>
+                    indicates the page number and order of the item from the NushuDuben reference source. The Nushu
+                    common reading is represented by the attribute <tt>kReading</tt>.</p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2827">[Nushu data,
+        52]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute kSrc_NushuDuben { xsd:string { pattern="[0-9]+\.[0-9]+" } }?
+
+  code-point-attributes &amp;=
+    attribute kReading { xsd:string }?
+</tt>
+         </p>
+         <h4>
+            <a name="d1e2835">4.4.26 Emoji properties</a>
+         </h4>
+         <p>The properties Emoji, EPres, EMod, EBase,
+                    EComp, and ExtPict have corresponding attributes:
+                </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2853">[Emoji properties,
+        53]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  code-point-attributes &amp;=
+    attribute Emoji { boolean }?
+
+  code-point-attributes &amp;=
+    attribute EPres { boolean }?
+
+  code-point-attributes &amp;=
+    attribute EMod { boolean }?
+
+  code-point-attributes &amp;=
+    attribute EBase { boolean }?
+
+  code-point-attributes &amp;=
+    attribute EComp { boolean }?
+
+  code-point-attributes &amp;=
+    attribute ExtPict { boolean }?
+</tt>
+         </p>
+         <h2>
+            <a name="d1e2864">5 Blocks</a>
+         </h2>
+         <p>The <tt>blocks</tt> child of the <tt>ucd</tt> describes the blocks. It has one child
+            <tt>block</tt> element per block, with attributes to describe the extent and name of the block.
+        </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2876">[blocks,
+        54]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  ucd.content &amp;=
+    element blocks {
+      element block {
+        attribute first-cp { single-code-point },
+        attribute last-cp { single-code-point },
+        attribute name { text } }+ }?
+</tt>
+         </p>
+         <h2>
+            <a name="d1e2884">6 Named Sequences</a>
+         </h2>
+         <p>The <tt>named-sequences</tt> child of the <tt>ucd</tt> describes the named sequences. It has one
+            child <tt>named-sequence</tt> element per named sequence, with attributes to describe the name and
+            sequence.
+        </p>
+         <p>Similarly, the <tt>provisional-named-sequences</tt> child of the <tt>ucd</tt> describes the
+            provisional named sequences.
+        </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2903">[named sequences,
+        55]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  ucd.content &amp;=
+    element named-sequences {
+      element named-sequence {
+        attribute cps { one-or-more-code-points },
+        attribute name { text } }+ }?
+
+  ucd.content &amp;=
+    element provisional-named-sequences {
+      element named-sequence {
+        attribute cps { one-or-more-code-points },
+        attribute name { text } }+ }?
+</tt>
+         </p>
+         <h2>
+            <a name="d1e2911">7 Normalization Corrections</a>
+         </h2>
+         <p>The <tt>normalization-corrections</tt> child of the <tt>ucd</tt> describes the normalization
+            corrections. It has one child <tt>normalization-correction</tt> element per correction, with
+            attributes to describe the code point affected, its old normalization, its new normalization and the
+            version of Unicode in which the correction was made.
+        </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2923">[normalization corrections,
+        56]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  ucd.content &amp;=
+    element normalization-corrections {
+      element normalization-correction {
+        attribute cp { single-code-point },
+        attribute old { one-or-more-code-points },
+        attribute new { one-or-more-code-points },
+        attribute version { text } }+ }?
+</tt>
+         </p>
+         <h2>
+            <a name="d1e2932">8 Standardized Variants</a>
+         </h2>
+         <p>The <tt>standardized-variants</tt> child of the <tt>ucd</tt> describes the standardized
+            variants. It has one child element <tt>standardized-variant</tt> per variant. The attributes on that
+            last element capture the variation sequence, the description of the desired appearance, and the shaping
+            environment under which the appearance is different.
+        </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2944">[standardized variants,
+        57]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  ucd.content &amp;=
+    element standardized-variants {
+      element standardized-variant {
+        attribute cps { two-code-points },
+        attribute desc { text },
+        attribute when { text } }+ }?
+</tt>
+         </p>
+         <h2>
+            <a name="d1e2952">9 CJK Radicals</a>
+         </h2>
+         <p>The <tt>cjk-radicals</tt> child of the <tt>ucd</tt> describes the CJK radicals. It has one
+            child element <tt>cjk-radical</tt> per radical. The attributes on that last element capture the
+            radical number, the corresponding CJK radical character, and the corresponding CJK unified ideograph.
+        </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2964">[cjk radicals,
+        58]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  ucd.content &amp;=
+    element cjk-radicals {
+      element cjk-radical {
+        attribute number { xsd:string {pattern="[0-9]{1,3}'{0,3}"}},
+        attribute radical { single-code-point? },
+        attribute ideograph { single-code-point } }+ }?
+</tt>
+         </p>
+         <h2>
+            <a name="d1e2972">10 Emoji sources</a>
+         </h2>
+         <p>The <tt>emoji-sources</tt> child of the <tt>ucd</tt> describes the emoji sources.
+        </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2982">[emoji sources,
+        59]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  ucd.content &amp;=
+    element emoji-sources {
+      element emoji-source {
+        attribute unicode { one-or-more-code-points },
+        attribute docomo { jis-code-point? },
+        attribute kddi { jis-code-point? },
+        attribute softbank { jis-code-point? } }+ }?
+</tt>
+         </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e2986">[datatype for code points,
+        60]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  jis-code-point = xsd:string { pattern = "[0-9A-F]{4}" }
+</tt>
+         </p>
+         <h2>
+            <a name="d1e2995">11 Do Not Emit</a>
+         </h2>
+         <p>
+            <span style="background-color: #ffff00; border-style:dotted; border-width:1px">The <tt>do-not-emit</tt> child of the <tt>ucd</tt> describes the
+            character sequences that should not be emitted or generated in newly authored texts.
+            </span>
+         </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e3006">[do-not-emit,
+        61]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+  ucd.content &amp;=
+    element do-not-emit {
+      element instead {
+        attribute of { one-or-more-code-points },
+        attribute use { one-or-more-code-points },
+        attribute because { "Bengali_Khanda_Ta"
+                          | "Deprecated"
+                          | "Discouraged"
+                          | "Dotless_Form"
+                          | "Hamza_Form"
+                          | "Indic_Atomic_Consonant"
+                          | "Indic_Consonant_Conjunct"
+                          | "Indic_Vowel_Letter"
+                          | "Malayalam_Chillu"
+                          | "Precomposed_Form"
+                          | "Precomposed_Hieroglyph"
+                          | "Preferred_Spelling"
+                          | "Tamil_Shrii"
+      } }+ }?
+</tt>
+         </p>
+         <h2>
+            <a name="d1e3014">12 The full schema</a>
+         </h2>
+         <p>Our schema is just the accumulation of the pieces we have described so far:
+        </p>
+         <p>
+            <i>
+               <a name="ucdxml:d1e3018">[UCD RelaxNG schema]
+      </a>
+        =</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[namespace declaration: <a href="#ucdxml:d1e1812">1</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[datatypes: <a href="#ucdxml:d1e1829">2</a>, <a href="#ucdxml:d1e1837">3</a>, <a href="#ucdxml:d1e2986">60</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[schema start: <a href="#ucdxml:d1e1854">4</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[boolean: <a href="#ucdxml:d1e1871">5</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[description: <a href="#ucdxml:d1e1914">6</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[repertoire: <a href="#ucdxml:d1e1933">7</a>, <a href="#ucdxml:d1e1947">8</a>, <a href="#ucdxml:d1e1992">9</a>, <a href="#ucdxml:d1e2047">10</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[attributes: <a href="#ucdxml:d1e2092">11</a>, <a href="#ucdxml:d1e2109">12</a>, <a href="#ucdxml:d1e2112">13</a>, <a href="#ucdxml:d1e2160">14</a>, <a href="#ucdxml:d1e2177">15</a>, <a href="#ucdxml:d1e2192">16</a>, <a href="#ucdxml:d1e2211">17</a>, <a href="#ucdxml:d1e2226">18</a>, <a href="#ucdxml:d1e2234">19</a>, <a href="#ucdxml:d1e2243">20</a>, <a href="#ucdxml:d1e2255">21</a>, <a href="#ucdxml:d1e2266">22</a>, <a href="#ucdxml:d1e2269">23</a>, <a href="#ucdxml:d1e2288">24</a>, <a href="#ucdxml:d1e2303">25</a>, <a href="#ucdxml:d1e2328">26</a>, <a href="#ucdxml:d1e2349">27</a>, <a href="#ucdxml:d1e2369">28</a>, <a href="#ucdxml:d1e2380">29</a>, <a href="#ucdxml:d1e2397">30</a>, <a href="#ucdxml:d1e2413">31</a>, <a href="#ucdxml:d1e2434">32</a>, <a href="#ucdxml:d1e2449">33</a>, <a href="#ucdxml:d1e2461">34</a>, <a href="#ucdxml:d1e2475">35</a>, <a href="#ucdxml:d1e2503">36</a>, <a href="#ucdxml:d1e2522">37</a>, <a href="#ucdxml:d1e2538">38</a>, <a href="#ucdxml:d1e2555">39</a>, <a href="#ucdxml:d1e2565">40</a>, <a href="#ucdxml:d1e2582">41</a>, <a href="#ucdxml:d1e2592">42</a>, <a href="#ucdxml:d1e2603">43</a>, <a href="#ucdxml:d1e2634">44</a>, <a href="#ucdxml:d1e2644">45</a>, <a href="#ucdxml:d1e2704">46</a>, <a href="#ucdxml:d1e2732">47</a>, <a href="#ucdxml:d1e2761">48</a>, <a href="#ucdxml:d1e2780">49</a>, <a href="#ucdxml:d1e2792">50</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[Tangut data: <a href="#ucdxml:d1e2810">51</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[Nushu data: <a href="#ucdxml:d1e2827">52</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[blocks: <a href="#ucdxml:d1e2876">54</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[named sequences: <a href="#ucdxml:d1e2903">55</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[normalization corrections: <a href="#ucdxml:d1e2923">56</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[standardized variants: <a href="#ucdxml:d1e2944">57</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[cjk radicals: <a href="#ucdxml:d1e2964">58</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[emoji sources: <a href="#ucdxml:d1e2982">59</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[Emoji properties: <a href="#ucdxml:d1e2853">53</a>]</i>
+            <tt style="white-space: pre;">
+      </tt>
+            <i>[do-not-emit: <a href="#ucdxml:d1e3006">61</a>]</i>
+            <tt style="white-space: pre;">
+</tt>
+         </p>
+         <p>An expanded version is linked from the top of this document.</p>
+         <h2>
+            <a name="d1e3064">13 Examples</a>
+         </h2>
+         <p>Here is a fragment of the UCD for a few representative
+            characters (only some of the properties are represented):
+        </p>
+         <pre>
+            
+  &lt;ucd xmlns="http://www.unicode.org/ns/2003/ucd/1.0"&gt;
+    &lt;repertoire&gt;
+      &lt;char cp="001F" age="1.1" na="&amp;lt;control&amp;gt;" na1="UNIT SEPARATOR"
+            gc="Cc" bc="S" lb="CM"/&gt;
+
+      &lt;char cp="0020" age="1.1" na="SPACE" gc="Zs" bc="WS" ea="Na" lb="SP"/&gt;
+
+      &lt;char cp="0026" age="1.1" na="AMPERSAND" gc="Po" bc="ON" ea="Na"/&gt;
+
+      &lt;char cp="0028" age="1.1" na="LEFT PARENTHESIS" na1="OPENING PARENTHESIS"
+            gc="Ps" bc="ON" Bidi_M="y" bmg="0029" ea="Na" lb="OP"/&gt;
+
+      &lt;char cp="0041" age="1.1" na="LATIN CAPITAL LETTER A"
+            gc="Lu" slc="0061" ea="Na" sc="Latn"/&gt;
+
+      &lt;char cp="AC00" age="2.0" na="HANGUL SYLLABLE GA" gc="Lo"
+            dt="can" dm="1100 1161" ea="W" lb="ID" sc="Hang"/&gt;
+
+      &lt;char cp="20094" age="3.1" na="CJK UNIFIED IDEOGRAPH-20094"
+            gc="Lo" ea="W" lb="ID" sc="Hani" kIRG_GSource="GKX-0082.09"
+            kIRGHanyuDaZidian="10036.060" kIRG_TSource="T5-214E"
+            kRSUnicode="4.3" kIRGKangXi="0082.090"/&gt;
+
+      &lt;group age="3.2" gc="Lo" sc="Buhd"&gt;
+        &lt;char cp="1740" na="BUHID LETTER A"/&gt;
+        &lt;char cp="1741" na="BUHID LETTER I"/&gt;
+        &lt;char cp="1752" na="BUHID VOWEL SIGN I" gc="Mn"/&gt;
+        &lt;char cp="1820" age="3.0" na="MONGOLIAN LETTER A" sc="Mong"/&gt;
+      &lt;/group&gt;
+    &lt;/repertoire&gt;
+  &lt;/ucd&gt;
+
+</pre>
+         <h2>
+            <a name="d1e3076">Acknowledgments</a>
+         </h2>
+         <p>Thanks to Markus Scherer and Mark Davis for their help developing this XML representation. Thanks to
+            the reviewers: Julie Allen, Ernest van den Boogaard, Daniel Bünzli, John Cowan, Asmus Freytag,
+            Felix Sasaki, Andrew West. Special thanks to Eric Muller and Laurențiu Iancu.
+        </p>
+         <h2>
+            <a name="Modifications">Modifications</a>
+         </h2>
+         <p>This section indicates the changes introduced by each revision.</p>
+         <div>
+            <p>
+               <b>Revision 36</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>16.0</tt>.
+                    </li>
+               <li>New values for the <tt>blk</tt> attribute: <tt>Egyptian_Hieroglyphs_Ext_A</tt>,
+                        <tt>Garay</tt>, <tt>Gurung_Khema</tt>, <tt>Kirat_Rai</tt>, <tt>Myanmar_Ext_C</tt>,
+                        <tt>Ol_Onal</tt>, <tt>Sunuwar</tt>, <tt>Symbols_for_Legacy_Computing_Sup</tt>,
+                        <tt>Todhri</tt>, <tt>Tulu_Tigalari</tt>.
+                    </li>
+               <li>New values for the <tt>sc</tt> attribute: <tt>Gara</tt>, <tt>Gukh</tt>,
+                        <tt>Krai</tt>, <tt>Onao</tt>, <tt>Sunu</tt>, <tt>Todr</tt>, <tt>Tutg</tt>.
+                    </li>
+               <li>New value for the <tt>jg</tt> attribute: <tt>Kashmiri_Yeh</tt>.</li>
+               <li>New value for the <tt>InSC</tt> attribute: <tt>Reordering_Killer</tt>.
+                    </li>
+               <li>New attributes: <tt>MCM</tt>, <tt>kFanqie</tt>, <tt>kZhuang</tt>.
+                    </li>
+               <li>Modified patterns for the <tt>cjk-radical/@number</tt>, <tt>kRSUnicode</tt> and
+                        <tt>kIRG_GSource</tt> attributes.
+                    </li>
+               <li>Added the <tt>do-not-emit</tt> element.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 35 being a proposed update, only changes between revisions 34 and 36 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 34</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>15.1</tt>.
+                    </li>
+               <li>New value for the <tt>blk</tt> attribute: <tt>CJK_Ext_I</tt>.
+                    </li>
+               <li>New values for the <tt>lb</tt> attribute: <tt>AK</tt>, <tt>AP</tt>, <tt>
+                        AS</tt>, <tt>VF</tt>, <tt>VI</tt>.
+                    </li>
+               <li>Modified values for the <tt>number</tt> and <tt>radical</tt> attributes of the
+                        <tt>cjk-radical</tt> element.
+                    </li>
+               <li>Changed single value into list for the <tt>nv</tt> code point attribute.
+                    </li>
+               <li>New code point attributes: <tt>ID_Compat_Math_Continue</tt>, <tt>
+                        ID_Compat_Math_Start</tt>, <tt>IDSU</tt>, <tt>NFKC_SCF</tt>, <tt>InCB</tt>.
+                    </li>
+               <li>Modified patterns for the <tt>kBigFive</tt>, <tt>kIRG_GSource</tt>, <tt>
+                        kMorohashi</tt>, <tt>kRSUnicode</tt> attributes.
+                    </li>
+               <li>Changed single values into lists for the <tt>kMorohashi</tt>, <tt>kPrimaryNumeric
+                    </tt> Unihan attributes.
+                    </li>
+               <li>New Unihan attributes: <tt>kJapanese</tt>, <tt>kMojiJoho</tt>, <tt>
+                        kSMSZD2003Index</tt>, <tt>kSMSZD2003Readings</tt>, <tt>kVietnameseNumeric</tt>, <tt>
+                        kZhuangNumeric</tt>.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 33 being a proposed update, only changes between revisions 32 and 34 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 32</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>15.0</tt>.
+                    </li>
+               <li>New values for the <tt>blk</tt> attribute: <tt>Arabic_Ext_C</tt>, <tt>CJK_Ext_H</tt>, <tt>
+                        Cyrillic_Ext_D</tt>, <tt>Devanagari_Ext_A</tt>, <tt>Kaktovik_Numerals</tt>, <tt>Kawi</tt>, <tt>
+                        Nag_Mundari</tt>.
+                    </li>
+               <li>New values for the <tt>script</tt> attribute: <tt>Kawi</tt>, <tt>Nagm</tt>.
+                    </li>
+               <li>New Unihan attribute: <tt>kAlternateTotalStrokes</tt>.
+                    </li>
+               <li>Modified patterns for the <tt>kIRG_GSource</tt>, <tt>kIRG_HSource</tt>, <tt>
+                        kIRG_TSource</tt>, <tt>kSemanticVariant</tt>, <tt>kSpecializedSemanticVariant</tt>, <tt>
+                        kZVariant
+                    </tt> attributes.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 31 being a proposed update, only changes between revisions 30 and 32 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 30</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>14.0</tt>.
+                    </li>
+               <li>New values for the <tt>blk</tt> attribute: <tt>Arabic_Ext_B</tt>, <tt>
+                        Cypro_Minoan</tt>, <tt>Ethiopic_Ext_B</tt>, <tt>Kana_Ext_B</tt>, <tt>
+                        Latin_Ext_F</tt>, <tt>Latin_Ext_G</tt>, <tt>Old_Uyghur</tt>, <tt>Tangsa</tt>, <tt>
+                        Toto</tt>, <tt>UCAS_Ext_A</tt>, <tt>Vithkuqi</tt>, <tt>Znamenny_Music</tt>.
+                    </li>
+               <li>New values for the <tt>script</tt> attribute: <tt>Cpmn</tt>, <tt>Ougr</tt>, <tt>
+                        Tnsa</tt>, <tt>Toto</tt>, <tt>Vith</tt>.
+                    </li>
+               <li>New values for the <tt>jg</tt> attribute: <tt>Thin_Yeh</tt>, <tt>Vertical_Tail</tt>.
+                    </li>
+               <li>New Unihan attribute: <tt>kStrange</tt>.
+                    </li>
+               <li>Modified patterns for the <tt>kIRG_GSource</tt>, <tt>kIRG_MSource</tt>, <tt>
+                        kIRG_VSource</tt>, <tt>kPhonetic</tt>, <tt>kSpoofingVariant</tt> attributes.
+                    </li>
+               <li>Removal of the <tt>kWubi</tt> attribute, which has never been present in
+                        released versions of the UCD.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 29 being a proposed update, only changes between revisions 28 and 30 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 28</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>13.0</tt>.
+                    </li>
+               <li>New values for the <tt>blk</tt> attribute: <tt>Chorasmian</tt>, <tt>CJK_Ext_G</tt>, <tt>
+                        Dives_Akuru</tt>, <tt>Khitan_Small_Script</tt>, <tt>Lisu_Sup</tt>, <tt>
+                        Symbols_For_Legacy_Computing</tt>, <tt>Tangut_Sup</tt>, <tt>Yezidi</tt>.
+                    </li>
+               <li>New values for the <tt>script</tt> attribute: <tt>Chrs</tt>, <tt>Diak</tt>, <tt>
+                        Kits</tt>, <tt>Yezi</tt>.
+                    </li>
+               <li>New value for the <tt>InPC</tt> attribute: <tt>Top_And_Bottom_And_Left</tt>.
+                    </li>
+               <li>New Unihan attributes <tt>kSpoofingVariant</tt>, <tt>kUnihanCore2020</tt>, <tt>
+                        kIRG_SSource</tt>, <tt>kIRG_UKSource</tt>, <tt>kTGHZ2013</tt>.
+                    </li>
+               <li>New Emoji attributes <tt>Emoji</tt>, <tt>EPres</tt>, <tt>EMod</tt>, <tt>
+                        EBase</tt>, <tt>EComp</tt>, <tt>ExtPict</tt>.
+                    </li>
+               <li>Modified patterns for the <tt>kIRG_GSource</tt>, <tt>kIRG_HSource</tt>, <tt>
+                        kIRG_KPSource</tt>, <tt>kIRG_KSource</tt>, <tt>kIRG_TSource</tt>, <tt>kKangXi</tt>, <tt>
+                        kSemanticVariant</tt>, <tt>kSimplifiedVariant</tt>, <tt>
+                        kSpecializedSemanticVariant</tt>, <tt>kTraditionalVariant</tt> attributes.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 27 being a proposed update, only changes between revisions 26 and 28 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 26</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>12.1</tt>.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>
+               <b>Revision 25</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>12.0</tt>.
+                    </li>
+               <li>New values for the <tt>script</tt> attribute: <tt>Elym</tt>, <tt>Hmnp</tt>, <tt>
+                        Nand</tt>, <tt>Wcho</tt>.
+                    </li>
+               <li>New values for the <tt>blk</tt> attribute: <tt>
+                        Egyptian_Hieroglyph_Format_Controls</tt>, <tt>Elymaic</tt>, <tt>Nandinagari</tt>, <tt>
+                        Nyiakeng_Puachue_Hmong</tt>, <tt>Ottoman_Siyaq_Numbers</tt>, <tt>Small_Kana_Ext</tt>, <tt>
+                        Symbols_And_Pictographs_Ext_A</tt>, <tt>Tamil_Sup</tt>, <tt>Wancho</tt>.
+                    </li>
+               <li>Modified patterns for the <tt>kIRG_GSource</tt>, <tt>kIRG_KSource</tt>, <tt>
+                        kIRG_TSource</tt>, <tt>kTaiwanTelegraph</tt> attributes.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 24 being a proposed update, only changes between revisions 23 and 25 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 23</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>11.0</tt>.
+                    </li>
+               <li>New values for the <tt>blk</tt> attribute: <tt>Chess_Symbols</tt>, <tt>
+                        Dogra</tt>, <tt>Georgian_Ext</tt>, <tt>Gunjala_Gondi</tt>, <tt>
+                        Hanifi_Rohingya</tt>, <tt>Indic_Siyaq_Numbers</tt>, <tt>Makasar</tt>, <tt>
+                        Mayan_Numerals</tt>, <tt>Medefaidrin</tt>, <tt>Old_Sogdian</tt>, <tt>Sogdian</tt>.
+                    </li>
+               <li>New values for the <tt>script</tt> attribute: <tt>Dogr</tt>, <tt>Gong</tt>, <tt>
+                        Maka</tt>, <tt>Medf</tt>, <tt>Rohg</tt>, <tt>Sogd</tt>, <tt>Sogo</tt>.
+                    </li>
+               <li>New values for the <tt>jg</tt> attribute: <tt>Hanifi_Rohingya_Kinna_Ya</tt>, <tt>
+                        Hanifi_Rohingya_Pa</tt>.
+                    </li>
+               <li>New value for the <tt>wb</tt> attribute: <tt>WSegSpace</tt>.
+                    </li>
+               <li>New value for the <tt>InSC</tt> attribute: <tt>Consonant_Initial_Postfixed</tt>.
+                    </li>
+               <li>New attributes: <tt>EqUIdeo</tt>, <tt>kJinmeiyoKanji</tt>, <tt>kJoyoKanji</tt>, <tt>
+                        kKoreanEducationHanja</tt>, <tt>kKoreanName</tt>, <tt>kTGH</tt>.
+                    </li>
+               <li>Modified patterns for the <tt>kTGT_MergedSrc</tt> attribute.
+                    </li>
+               <li>Modified patterns for the <tt>kIRG_GSource</tt>, <tt>kIRG_HSource</tt> and <tt>
+                        kIRG_VSource
+                    </tt> attributes.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 22 being a proposed update, only changes between revisions 21 and 23 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 21</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>10.0</tt>.
+                    </li>
+               <li>New values for the <tt>blk</tt> attribute: <tt>CJK_Ext_F</tt>, <tt>Kana_Ext_A</tt>, <tt>
+                        Masaram_Gondi</tt>, <tt>Nushu</tt>, <tt>Soyombo</tt>, <tt>Syriac_Sup</tt>, <tt>
+                        Zanabazar_Square</tt>.
+                    </li>
+               <li>New values for the <tt>sc</tt> attribute: <tt>Gonm</tt>, <tt>Nshu</tt>, <tt>
+                        Soyo</tt>, <tt>Zanb</tt>.
+                    </li>
+               <li>New values for the <tt>jg</tt> attribute: <tt>Malayalam_Nga</tt>, <tt>
+                        Malayalam_Ja</tt>, <tt>Malayalam_Nya</tt>, <tt>Malayalam_Tta</tt>, <tt>Malayalam_Nna</tt>, <tt>
+                        Malayalam_Nnna</tt>, <tt>Malayalam_Bha</tt>, <tt>Malayalam_Ra</tt>, <tt>
+                        Malayalam_Lla</tt>, <tt>Malayalam_Llla</tt>, <tt>Malayalam_Ssa</tt>.
+                    </li>
+               <li>New value for the <tt>InPC</tt> attribute: <tt>Bottom_And_Left</tt>.
+                    </li>
+               <li>Modified patterns for the <tt>kIRG_GSource</tt>, <tt>kIRG_JSource</tt>, <tt>
+                        kIRG_KSource
+                    </tt> attributes.
+                    </li>
+               <li>New code point attributes: <tt>vo</tt>,
+                        <tt>RI</tt>
+               </li>
+               <li>New code point attributes for Nushu data: <tt>kSrc_NushuDuben</tt> and <tt>
+                        kReading</tt>.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 20 being a proposed update, only changes between revisions 19 and 21 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 19</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>9.0</tt>.
+                    </li>
+               <li>New values for the <tt>sc</tt> attribute: <tt>Adlm</tt>, <tt>Bhks</tt>, <tt>
+                        Marc</tt>, <tt>Newa</tt>, <tt>Osge</tt>, <tt>Tang</tt>.
+                    </li>
+               <li>New values for the <tt>blk</tt> attribute: <tt>Adlam</tt>, <tt>Bhaiksuki</tt>, <tt>
+                        Cyrillic_Ext_C</tt>, <tt>Glagolitic_Sup</tt>, <tt>Ideographic_Symbols</tt>, <tt>
+                        Marchen</tt>, <tt>Mongolian_Sup</tt>, <tt>Newa</tt>, <tt>Osage</tt>, <tt>
+                        Tangut</tt>, <tt>Tangut_Components</tt>.
+                    </li>
+               <li>New values for the <tt>gcb</tt> attribute: <tt>EB</tt>, <tt>EBG</tt>, <tt>EM</tt>, <tt>
+                        GAZ</tt>, <tt>ZWJ</tt>.
+                    </li>
+               <li>New values for the <tt>wb</tt> attribute: <tt>EB</tt>, <tt>EBG</tt>, <tt>EM</tt>, <tt>
+                        GAZ</tt>, <tt>ZWJ</tt>.
+                    </li>
+               <li>New values for the <tt>lb</tt> attribute: <tt>EB</tt>, <tt>EM</tt>, <tt>ZWJ</tt>.
+                    </li>
+               <li>New values for the <tt>jg</tt> attribute: <tt>African_Feh</tt>, <tt>
+                        African_Noon</tt>, <tt>African_Qaf</tt>.
+                    </li>
+               <li>New code point attributes: <tt>PCM</tt>, <tt>kRSTUnicode</tt> and <tt>
+                        kTGT_MergedSrc</tt>.
+                    </li>
+               <li>Modified patterns for the <tt>kRSUnicode</tt>, <tt>kRSKangXi</tt>, <tt>
+                        kMandarin</tt>, <tt>kIRG_JSource</tt>, <tt>kIRG_USource</tt> and <tt>kFennIndex
+                    </tt> attributes.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 18 being a proposed update, only changes between revisions 17 and 19 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 17</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>8.0</tt>.
+                    </li>
+               <li>New values for the <tt>sc</tt> attribute: <tt>Ahom</tt>, <tt>Hatr</tt>, <tt>
+                        Hluw</tt>, <tt>Hung</tt>, <tt>Mult</tt>, <tt>Sgnw</tt>.
+                    </li>
+               <li>New values for the <tt>blk</tt> attribute: <tt>Ahom</tt>, <tt>
+                        Anatolian_Hieroglyphs</tt>, <tt>Cherokee_Sup</tt>, <tt>CJK_Ext_E</tt>, <tt>
+                        Early_Dynastic_Cuneiform</tt>, <tt>Hatran</tt>, <tt>Multani</tt>, <tt>Old_Hungarian</tt>, <tt>
+                        Sup_Symbols_And_Pictographs</tt>, <tt>Sutton_SignWriting</tt>.
+                    </li>
+               <li>New values for the <tt>InSC</tt> attribute: <tt>Consonant_Killer</tt>, <tt>
+                        Consonant_Prefixed</tt>, <tt>Consonant_With_Stacker</tt>, <tt>Syllable_Modifier</tt>.
+                    </li>
+               <li>New code point attributes: <tt>InPC</tt>, <tt>kJa</tt>.
+                    </li>
+               <li>New patterns for the <tt>kIRG_GSource</tt> attribute: <tt>GFC-</tt>, <tt>GGFZ-</tt>.
+                    </li>
+               <li>Switched the reference to ISO 19757 from :2003 and :2003 Amd1 to :2008.</li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 16 being a proposed update, only changes between revisions 15 and 17 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 15</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>7.0</tt>.
+                    </li>
+               <li>New values for the <tt>jg</tt> attribute.
+                    </li>
+               <li>New values for the <tt>sc</tt> attribute.
+                    </li>
+               <li>New values for the <tt>blk</tt> attribute.
+                    </li>
+               <li>New values for the <tt>InSC</tt> attribute.
+                    </li>
+               <li>New values for the <tt>kIICore</tt> attribute.
+                    </li>
+               <li>New values for the <tt>kIRG_GSource</tt> attribute.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 14 being a proposed update, only changes between revisions 13 and 15 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 13</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>6.3</tt>.
+                    </li>
+               <li>New values <tt>DQ</tt>, <tt>HL</tt>, <tt>SQ</tt> for the <tt>WB</tt> attribute (for Unicode 6.3).
+                    </li>
+               <li>New code point attributes <tt>bpt</tt> and <tt>bpb</tt> (for Unicode 6.3).
+                    </li>
+               <li>New values for the <tt>bc</tt> attribute: <tt>LRI</tt>, <tt>RLI</tt>, <tt>FSI</tt>, <tt>
+                        PDI
+                    </tt> (for Unicode 6.3).
+                    </li>
+               <li>Updated the patterns for <tt>kHanyuPinlu</tt> and <tt>kTotalStrokes</tt> (for
+                        Unicode 6.3).
+                    </li>
+               <li>Updated the patterns for <tt>kIRG_HSource</tt> and <tt>kIRG_HSource</tt> (for
+                        Unicode 6.2).
+                    </li>
+               <li>Clarified that the child elements of list-like elements are in no particular order.</li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 12 being a proposed update, only changes between revisions 11 and 13 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 11</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>6.2</tt>.
+                    </li>
+               <li>New value for the <tt>gcb</tt>, <tt>wb</tt> and <tt>lb</tt> attributes: <tt>
+                        RI
+                    </tt> (for Unicode 6.2).
+                    </li>
+               <li>Updated the patterns for <tt>kIRG_GSource</tt> and <tt>kIRG_HSource</tt> (for
+                        Unicode 6.2).
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 10 being a proposed update, only changes between revisions 9 and 11 are
+                noted here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 9</b>
+            </p>
+            <ul>
+               <li>Clarified the default values.</li>
+               <li>Indicate that property values may change from one release to the next.</li>
+               <li>Introduced the <tt>blk</tt> attribute, for the Block property.
+                    </li>
+               <li>Introduced the <tt>scx</tt> attribute, for the ScriptExtensions property.
+                    </li>
+               <li>Introduced the <tt>name-alias</tt> element, for the Name_Alias property.
+                    </li>
+               <li>New value for the <tt>age</tt> attribute: <tt>6.1</tt>.
+                    </li>
+               <li>New values for the <tt>script</tt> attribute: <tt>Cakm</tt>, <tt>Merc</tt>, <tt>
+                        Mero</tt>, <tt>Plrd</tt>, <tt>Shrd</tt>, <tt>Sora</tt>, <tt>Takr</tt>.
+                    </li>
+               <li>New values for the <tt>lb</tt> attribute: <tt>HL</tt> and <tt>CJ</tt>.
+                    </li>
+               <li>New value for the <tt>jg</tt> attribute: <tt>Rohingya_Yeh</tt>.
+                    </li>
+               <li>The value of the <tt>fc_nfkc</tt> attribute must now be either # or <tt>
+                        one-or-more-code-points</tt>.
+                    </li>
+               <li>For the <tt>nv</tt> attribute, the absence of a numeric value is now represented by <tt>
+                        NaN
+                    </tt> rather than by the empty string.
+                    </li>
+               <li>The values of the ccc are now restricted to 0..254, instead of 0..255.
+                    </li>
+               <li>Updated the patterns for <tt>kSemanticVariant</tt>, <tt>
+                        kSpecializedSemanticVariant</tt>, <tt>kIRG_USource</tt>, and <tt>kMandarin</tt>.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 8 being a proposed update, only changes between revisions 7 and 9 are noted
+                here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 7</b>
+            </p>
+            <ul>
+               <li>New value for the <tt>age</tt> attribute: <tt>6.0</tt>.
+                    </li>
+               <li>New value for the <tt>jg</tt> attribute:
+                        <tt>Teh_Marbuta_Goal</tt>
+               </li>
+               <li>New values for the <tt>script</tt> attribute: <tt>Batk</tt>, <tt>Brah</tt>, <tt>
+                        Mand</tt>.
+                    </li>
+               <li>Updated the patterns for <tt>kIRG_GSource</tt>, <tt>kIRG_HSource</tt>, <tt>
+                        kIRG_JSource</tt>, <tt>kIRG_KSource</tt>, <tt>kIRG_MSource</tt>, <tt>
+                        kIRG_TSource</tt>, <tt>kIRG_VSource</tt>.
+                    </li>
+               <li>Added the <tt>InSC</tt> and <tt>InMC</tt> elements.
+                    </li>
+               <li>Added the <tt>emoji-sources</tt> element.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 6 being a proposed update, only changes between revisions 5 and 7 are noted
+                here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 5</b>
+            </p>
+            <ul>
+               <li>Changed the type of <tt>block/@first-cp</tt>, <tt>block/@last-cp</tt> and <tt>
+                        normalization-corrections/@cp
+                    </tt> from <tt>text</tt> to
+                        <tt>single-code-point</tt>
+               </li>
+               <li>Changed the type of <tt>named-sequence/@cps</tt>, <tt>
+                        provisional-named-sequences/@cps</tt>, <tt>normalization-correction/@old</tt> and <tt>
+                        normalization-correction/@new
+                    </tt> from <tt>text</tt> to <tt>one-or-more-code-points</tt>.
+                    </li>
+               <li>Changed the type of <tt>standardized-variants/@cps</tt> from <tt>text</tt> to <tt>
+                        two-code-points</tt>.
+                    </li>
+               <li>New values for the <tt>jg</tt> attribute: <tt>Farsi_Yeh</tt> and <tt>Nya</tt>.
+                    </li>
+               <li>New value for the <tt>age</tt> attribute: <tt>5.2</tt>.
+                    </li>
+               <li>New values for the <tt>sc</tt> attribute: <tt>Lana</tt>, <tt>Tavt</tt>, <tt>
+                        Avst</tt>, <tt>Egyp</tt>, <tt>Samr</tt>, <tt>Lisu</tt>, <tt>Bamu</tt>, <tt>Java</tt>, <tt>
+                        Mtei</tt>, <tt>Armi</tt>, <tt>Sarb</tt>, <tt>Prti</tt>, <tt>Phli</tt>, <tt>Orkh</tt>, <tt>
+                        Kthi</tt>.
+                    </li>
+               <li>New value for the <tt>lb</tt> attribute: <tt>CP</tt>.
+                    </li>
+               <li>New value for the <tt>sc</tt> attribute: <tt>Zinh</tt>.
+                    </li>
+               <li>New code point attributes CI, <tt>Cased</tt>, <tt>CWCF</tt>, <tt>
+                        CWCM</tt>, <tt>CWL</tt>, <tt>CWKCF</tt>, <tt>CWT</tt>, <tt>CWU</tt>, <tt>
+                        NFKC_CF</tt>.
+                    </li>
+               <li>New attributes <tt>kHanyuPinyin</tt> and <tt>kIRG_MSource</tt>.
+                    </li>
+               <li>New element
+                        <tt>cjk-radicals</tt>
+               </li>
+               <li>Updated the patterns for <tt>kIRG_GSource</tt>, <tt>kIRG_JSource</tt>, <tt>
+                        kIRG_KPSource</tt>, <tt>kIRG_KSource</tt>, <tt>kIRG_TSource</tt>, <tt>
+                        kIRG_VSource</tt>, <tt>kHanyuPinlu</tt>, <tt>kMandarin</tt>, <tt>
+                        kSemanticVariant</tt>, <tt>kSpecializedSemanticVariant</tt>, <tt>
+                        kVietnamese</tt>, <tt>kZVariant</tt>.
+                    </li>
+               <li>Point out that Relax NG schemas do not modify or augment the infoset, and that it is possible
+                        to mechanically convert our schema to other schema languages.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>Revision 4 being a proposed update, only changes between revisions 3 and 5 are noted
+                here.
+            </p>
+         </div>
+         <div>
+            <p>
+               <b>Revision 3</b>
+            </p>
+            <ul>
+               <li>First approved version, for Unicode 5.1.0.</li>
+               <li>For optional elements which act as collections, such as <tt>repertoire</tt> and <tt>
+                        named-sequences</tt>, impose that there be at least one element in the collection.
+                    </li>
+               <li>Remove the constraint that the value of <tt>jg</tt> is limited when <tt>jt</tt> has
+                        certain values; similarly for <tt>bmg</tt> / <tt>Bidi_M</tt> and for <tt>nv</tt> /
+                        <tt>nt</tt>.
+                    </li>
+               <li>Value <tt>NL</tt> added to the <tt>WB</tt> attribute (for Unicode 5.1).
+                    </li>
+               <li>Value <tt>PP</tt> added to the <tt>GCB</tt> attribute (for Unicode 5.1).
+                    </li>
+               <li>Corrected the <tt>Vai</tt> script value to <tt>Vaii</tt>.
+                    </li>
+               <li>Removed the discussion of elements or attributes in different namespaces.</li>
+               <li>Removed the <tt>code-point</tt> element.
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>
+               <b>Revision 2</b>
+            </p>
+            <ul>
+               <li>Promoted to Draft UAX.</li>
+               <li>Changed the title from "An XML representation of the UCD"</li>
+               <li>Value <tt>5.1</tt> added to the <tt>age</tt> attribute (for Unicode 5.1).
+                    </li>
+               <li>Value <tt>SM</tt> added to the <tt>gcb</tt> attribute (for Unicode 5.1).
+                    </li>
+               <li>Values <tt>CR</tt>, <tt>Extend</tt>, <tt>LF</tt>, <tt>MB</tt> added to the <tt>
+                        WB
+                    </tt> attribute (for Unicode 5.1).
+                    </li>
+               <li>Values <tt>CR</tt>, <tt>EX</tt>, <tt>LF</tt>, <tt>SC</tt> added to the <tt>SB
+                    </tt> attribute (for Unicode 5.1).
+                    </li>
+               <li>Value <tt>Burushaski_Yeh_Barree</tt> added to the <tt>jg</tt> attribute (for
+                        Unicode 5.1).
+                    </li>
+               <li>Value <tt>Alef_Maqsurah</tt> added to the <tt>jg</tt> attribute (for Unicode 2.x).
+                    </li>
+               <li>Values <tt>Cari</tt>, <tt>Cham</tt>, <tt>Kali</tt>, <tt>Lepc</tt>, <tt>
+                        Lyci</tt>, <tt>Lydi</tt>, <tt>Olck</tt>, <tt>Rjng</tt>, <tt>Saur</tt>, <tt>Sund</tt> and <tt>
+                        Vai
+                    </tt> added to the <tt>sc</tt> attribute (for Unicode 5.0).
+                    </li>
+               <li>
+                  <tt>jamo</tt>
+                        attribute renamed to
+                        <tt>JSN</tt>
+               </li>
+               <li>
+                  <tt>sfc</tt>
+                        attribute renamed to
+                        <tt>scf</tt>
+               </li>
+               <li>Attribute <tt>kXHC1983</tt> added (for Unicode 5.1.0).
+                    </li>
+               <li>Pattern for attribute <tt>kIRG_USource</tt> extended (for Unicode 5.1.0).
+                    </li>
+               <li>Element <tt>provisional-named-sequences</tt> added (for Unicode 5.0).
+                    </li>
+            </ul>
+         </div>
+         <div>
+            <p>
+               <b>Revision 1</b>
+            </p>
+            <ul>
+               <li>First working draft.</li>
+            </ul>
+         </div>
+         <hr/>
+         <p class="copyright">© 2008–2024 Unicode, Inc. This
+      publication is protected by copyright, and permission must be obtained from Unicode, Inc. prior to any
+      reproduction, modification, or other use not permitted by the
+      <a href="https://www.unicode.org/copyright.html">Terms of Use</a>. Specifically, you may make copies of this
+      publication and may annotate and translate it solely for personal or internal business purposes and not for
+      public distribution, provided that any such permitted copies and modifications fully reproduce all copyright and
+      other legal notices contained in the original. You may not make copies of or modifications to this publication
+      for public distribution, or incorporate it in whole or in part into any product or publication without the
+      express written permission of Unicode.</p>
+         <p class="copyright">Use of all Unicode Products, including this publication, is governed by the Unicode
+      <a href="https://www.unicode.org/copyright.html">Terms of Use</a>. The authors, contributors, and publishers have
+      taken care in the preparation of this publication, but make no express or implied representation or warranty of
+      any kind and assume no responsibility or liability for errors or omissions or for consequential or incidental
+      damages that may arise therefrom. This publication is provided “AS-IS” without charge as a convenience to
+      users.</p>
+         <p class="copyright">Unicode and the Unicode Logo are registered trademarks of Unicode, Inc., in the United States
+      and other countries.</p>
+      </div>
+   </body>
+</html>
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/output/index.rnc b/unicodetools/src/main/resources/org/unicode/uax42/output/index.rnc
new file mode 100644
index 000000000..84d9b5875
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/output/index.rnc
@@ -0,0 +1,1455 @@
+
+    # Copyright © 2024 Unicode, Inc.
+
+    
+      
+  default namespace ucd = "http://www.unicode.org/ns/2003/ucd/1.0"
+
+      
+  # default; datatypes xsd = "http://www.w3.org/2001/XMLSchema-datatypes"
+
+  single-code-point = xsd:string { pattern = "(|[1-9A-F]|(10))[0-9A-F]{4}" }  # 4 to 6 uppercase hex digits, 0000..10FFFF; no leading zeros past four digits
+
+  one-or-more-code-points = list { single-code-point + }  # whitespace-separated tokens, at least one code point
+  zero-or-more-code-points = list { single-code-point * }  # whitespace-separated tokens, may be empty
+  two-code-points = list { single-code-point, single-code-point }  # exactly two whitespace-separated code points
+
+  jis-code-point = xsd:string { pattern = "[0-9A-F]{4}" }  # exactly four uppercase hex digits
+
+      
+  start =  # schema entry point: the document element is <ucd>
+    element ucd { ucd.content }  # its content is whatever the ucd.content fragments contribute
+
+      
+  boolean = "Y" | "N"  # two-valued flag type referenced by the yes/no attributes of code-point-attributes
+
+      
+  ucd.content &=  # &= interleaves this fragment with the other ucd.content fragments (order-free)
+    element description { text }?  # optional free-text <description> child
+
+      
+  ucd.content &=  # &= interleaves this fragment with the other ucd.content fragments (order-free)
+    element repertoire { (code-point | group) + }?  # optional <repertoire>: one or more code-point or group elements, freely mixed
+
+  set-of-code-points =  # identifies what an element covers: one code point or a first/last pair
+     attribute cp { single-code-point }  # form 1: a single code point
+   | ( attribute first-cp { single-code-point },  # form 2: both first-cp and last-cp are required together
+       attribute last-cp  { single-code-point } )  # NOTE(review): presumably an inclusive range — confirm against the spec text
+
+  code-point |=  # |= adds one alternative to the code-point choice; this one is <reserved>
+    element reserved {
+      set-of-code-points,  # cp, or first-cp + last-cp
+      code-point-attributes }  # same attribute set as the other three alternatives
+
+  code-point |=  # alternative: <noncharacter>
+    element noncharacter {
+      set-of-code-points,
+      code-point-attributes }
+
+  code-point |=  # alternative: <surrogate>
+    element surrogate {
+      set-of-code-points,
+      code-point-attributes }
+
+  code-point |=  # alternative: <char>
+    element char {
+      set-of-code-points,
+      code-point-attributes }
+
+  group =  # container element usable inside <repertoire> next to bare code-point elements
+    element group {
+      code-point-attributes,  # NOTE(review): presumably these act as defaults for the contained code points — confirm
+      code-point* }  # zero or more reserved/noncharacter/surrogate/char children; groups do not nest
+
+      
+  code-point-attributes &=
+    attribute age { "1.1"
+                  | "2.0" | "2.1"
+                  | "3.0" | "3.1" | "3.2"
+                  | "4.0" | "4.1"
+                  | "5.0" | "5.1" | "5.2"
+                  | "6.0" | "6.1" | "6.2" | "6.3"
+                  | "7.0"
+                  | "8.0"
+                  | "9.0"
+                  | "10.0"
+                  | "11.0"
+                  | "12.0" | "12.1"
+                  | "13.0"
+                  | "14.0"
+                  | "15.0" | "15.1"
+                  | "16.0"
+                  | "17.0"
+                  | "unassigned"
+                  }?
+
+  code-point-attributes &=
+    attribute na { "" |
+                   "CJK UNIFIED IDEOGRAPH-#" |
+                   "CJK COMPATIBILITY IDEOGRAPH-#" |
+                   "EGYPTIAN HIEROGLYPH-#" |
+                   "TANGUT IDEOGRAPH-#" |
+                   "KHITAN SMALL SCRIPT CHARACTER-#" |
+                   "NUSHU CHARACTER-#" |
+                   xsd:string { pattern="[a-zA-Z0-9]+(( -|- |[\-_ ])[a-zA-Z0-9]+)*" }
+                 }?
+
+  code-point-attributes &=
+    attribute na1 { "" | xsd:string { pattern="[a-zA-Z0-9]+([\-_ ][a-zA-Z0-9]+)*( \(.*\))?" } }?
+
+  code-point-attributes &=
+    element name-alias {
+      attribute alias { xsd:string { pattern="[a-zA-Z0-9]+(( -|- |[\-_ ])[a-zA-Z0-9]+)*" } }?,
+      attribute type  { "abbreviation" | "alternate"
+                      | "control" | "correction"
+                      | "figment"
+                      }? } *
+
+  code-point-attributes &=
+    attribute blk { "Adlam"
+                  | "Aegean_Numbers"
+                  | "Ahom"
+                  | "Alchemical"
+                  | "Alphabetic_PF"
+                  | "Anatolian_Hieroglyphs"
+                  | "Ancient_Greek_Music"
+                  | "Ancient_Greek_Numbers"
+                  | "Ancient_Symbols"
+                  | "Arabic"
+                  | "Arabic_Ext_A"
+                  | "Arabic_Ext_B"
+                  | "Arabic_Ext_C"
+                  | "Arabic_Math"
+                  | "Arabic_PF_A"
+                  | "Arabic_PF_B"
+                  | "Arabic_Sup"
+                  | "Armenian"
+                  | "Arrows"
+                  | "ASCII"
+                  | "Avestan"
+                  | "Balinese"
+                  | "Bamum"
+                  | "Bamum_Sup"
+                  | "Bassa_Vah"
+                  | "Batak"
+                  | "Bengali"
+                  | "Bhaiksuki"
+                  | "Block_Elements"
+                  | "Bopomofo"
+                  | "Bopomofo_Ext"
+                  | "Box_Drawing"
+                  | "Brahmi"
+                  | "Braille"
+                  | "Buginese"
+                  | "Buhid"
+                  | "Byzantine_Music"
+                  | "Carian"
+                  | "Caucasian_Albanian"
+                  | "Chakma"
+                  | "Cham"
+                  | "Cherokee"
+                  | "Cherokee_Sup"
+                  | "Chess_Symbols"
+                  | "Chorasmian"
+                  | "CJK"
+                  | "CJK_Compat"
+                  | "CJK_Compat_Forms"
+                  | "CJK_Compat_Ideographs"
+                  | "CJK_Compat_Ideographs_Sup"
+                  | "CJK_Ext_A"
+                  | "CJK_Ext_B"
+                  | "CJK_Ext_C"
+                  | "CJK_Ext_D"
+                  | "CJK_Ext_E"
+                  | "CJK_Ext_F"
+                  | "CJK_Ext_G"
+                  | "CJK_Ext_H"
+                  | "CJK_Ext_I"
+                  | "CJK_Radicals_Sup"
+                  | "CJK_Strokes"
+                  | "CJK_Symbols"
+                  | "Compat_Jamo"
+                  | "Control_Pictures"
+                  | "Coptic"
+                  | "Coptic_Epact_Numbers"
+                  | "Counting_Rod"
+                  | "Cuneiform"
+                  | "Cuneiform_Numbers"
+                  | "Currency_Symbols"
+                  | "Cypriot_Syllabary"
+                  | "Cypro_Minoan"
+                  | "Cyrillic"
+                  | "Cyrillic_Ext_A"
+                  | "Cyrillic_Ext_B"
+                  | "Cyrillic_Ext_C"
+                  | "Cyrillic_Ext_D"
+                  | "Cyrillic_Sup"
+                  | "Deseret"
+                  | "Devanagari"
+                  | "Devanagari_Ext"
+                  | "Devanagari_Ext_A"
+                  | "Diacriticals"
+                  | "Diacriticals_Ext"
+                  | "Diacriticals_For_Symbols"
+                  | "Diacriticals_Sup"
+                  | "Dingbats"
+                  | "Dives_Akuru"
+                  | "Dogra"
+                  | "Domino"
+                  | "Duployan"
+                  | "Early_Dynastic_Cuneiform"
+                  | "Egyptian_Hieroglyph_Format_Controls"
+                  | "Egyptian_Hieroglyphs"
+                  | "Egyptian_Hieroglyphs_Ext_A"
+                  | "Elbasan"
+                  | "Elymaic"
+                  | "Emoticons"
+                  | "Enclosed_Alphanum"
+                  | "Enclosed_Alphanum_Sup"
+                  | "Enclosed_CJK"
+                  | "Enclosed_Ideographic_Sup"
+                  | "Ethiopic"
+                  | "Ethiopic_Ext"
+                  | "Ethiopic_Ext_A"
+                  | "Ethiopic_Ext_B"
+                  | "Ethiopic_Sup"
+                  | "Garay"
+                  | "Geometric_Shapes"
+                  | "Geometric_Shapes_Ext"
+                  | "Georgian"
+                  | "Georgian_Ext"
+                  | "Georgian_Sup"
+                  | "Glagolitic"
+                  | "Glagolitic_Sup"
+                  | "Gothic"
+                  | "Grantha"
+                  | "Greek"
+                  | "Greek_Ext"
+                  | "Gujarati"
+                  | "Gunjala_Gondi"
+                  | "Gurmukhi"
+                  | "Gurung_Khema"
+                  | "Half_And_Full_Forms"
+                  | "Half_Marks"
+                  | "Hangul"
+                  | "Hanifi_Rohingya"
+                  | "Hanunoo"
+                  | "Hatran"
+                  | "Hebrew"
+                  | "High_PU_Surrogates"
+                  | "High_Surrogates"
+                  | "Hiragana"
+                  | "IDC"
+                  | "Ideographic_Symbols"
+                  | "Imperial_Aramaic"
+                  | "Indic_Number_Forms"
+                  | "Indic_Siyaq_Numbers"
+                  | "Inscriptional_Pahlavi"
+                  | "Inscriptional_Parthian"
+                  | "IPA_Ext"
+                  | "Jamo"
+                  | "Jamo_Ext_A"
+                  | "Jamo_Ext_B"
+                  | "Javanese"
+                  | "Kaithi"
+                  | "Kaktovik_Numerals"
+                  | "Kana_Ext_A"
+                  | "Kana_Ext_B"
+                  | "Kana_Sup"
+                  | "Kanbun"
+                  | "Kangxi"
+                  | "Kannada"
+                  | "Katakana"
+                  | "Katakana_Ext"
+                  | "Kawi"
+                  | "Kayah_Li"
+                  | "Kharoshthi"
+                  | "Khitan_Small_Script"
+                  | "Khmer"
+                  | "Khmer_Symbols"
+                  | "Khojki"
+                  | "Khudawadi"
+                  | "Kirat_Rai"
+                  | "Lao"
+                  | "Latin_1_Sup"
+                  | "Latin_Ext_A"
+                  | "Latin_Ext_Additional"
+                  | "Latin_Ext_B"
+                  | "Latin_Ext_C"
+                  | "Latin_Ext_D"
+                  | "Latin_Ext_E"
+                  | "Latin_Ext_F"
+                  | "Latin_Ext_G"
+                  | "Lepcha"
+                  | "Letterlike_Symbols"
+                  | "Limbu"
+                  | "Linear_A"
+                  | "Linear_B_Ideograms"
+                  | "Linear_B_Syllabary"
+                  | "Lisu"
+                  | "Lisu_Sup"
+                  | "Low_Surrogates"
+                  | "Lycian"
+                  | "Lydian"
+                  | "Mahajani"
+                  | "Mahjong"
+                  | "Makasar"
+                  | "Malayalam"
+                  | "Mandaic"
+                  | "Manichaean"
+                  | "Marchen"
+                  | "Masaram_Gondi"
+                  | "Math_Alphanum"
+                  | "Math_Operators"
+                  | "Mayan_Numerals"
+                  | "Medefaidrin"
+                  | "Meetei_Mayek"
+                  | "Meetei_Mayek_Ext"
+                  | "Mende_Kikakui"
+                  | "Meroitic_Cursive"
+                  | "Meroitic_Hieroglyphs"
+                  | "Miao"
+                  | "Misc_Arrows"
+                  | "Misc_Math_Symbols_A"
+                  | "Misc_Math_Symbols_B"
+                  | "Misc_Pictographs"
+                  | "Misc_Symbols"
+                  | "Misc_Technical"
+                  | "Modi"
+                  | "Modifier_Letters"
+                  | "Modifier_Tone_Letters"
+                  | "Mongolian"
+                  | "Mongolian_Sup"
+                  | "Mro"
+                  | "Multani"
+                  | "Music"
+                  | "Myanmar"
+                  | "Myanmar_Ext_A"
+                  | "Myanmar_Ext_B"
+                  | "Myanmar_Ext_C"
+                  | "Nabataean"
+                  | "Nag_Mundari"
+                  | "Nandinagari"
+                  | "NB"
+                  | "New_Tai_Lue"
+                  | "Newa"
+                  | "NKo"
+                  | "Number_Forms"
+                  | "Nushu"
+                  | "Nyiakeng_Puachue_Hmong"
+                  | "OCR"
+                  | "Ogham"
+                  | "Ol_Chiki"
+                  | "Ol_Onal"
+                  | "Old_Hungarian"
+                  | "Old_Italic"
+                  | "Old_North_Arabian"
+                  | "Old_Permic"
+                  | "Old_Persian"
+                  | "Old_Sogdian"
+                  | "Old_South_Arabian"
+                  | "Old_Turkic"
+                  | "Old_Uyghur"
+                  | "Oriya"
+                  | "Ornamental_Dingbats"
+                  | "Osage"
+                  | "Osmanya"
+                  | "Ottoman_Siyaq_Numbers"
+                  | "Pahawh_Hmong"
+                  | "Palmyrene"
+                  | "Pau_Cin_Hau"
+                  | "Phags_Pa"
+                  | "Phaistos"
+                  | "Phoenician"
+                  | "Phonetic_Ext"
+                  | "Phonetic_Ext_Sup"
+                  | "Playing_Cards"
+                  | "Psalter_Pahlavi"
+                  | "PUA"
+                  | "Punctuation"
+                  | "Rejang"
+                  | "Rumi"
+                  | "Runic"
+                  | "Samaritan"
+                  | "Saurashtra"
+                  | "Sharada"
+                  | "Shavian"
+                  | "Shorthand_Format_Controls"
+                  | "Siddham"
+                  | "Sinhala"
+                  | "Sinhala_Archaic_Numbers"
+                  | "Small_Forms"
+                  | "Small_Kana_Ext"
+                  | "Sogdian"
+                  | "Sora_Sompeng"
+                  | "Soyombo"
+                  | "Specials"
+                  | "Sundanese"
+                  | "Sundanese_Sup"
+                  | "Sunuwar"
+                  | "Sup_Arrows_A"
+                  | "Sup_Arrows_B"
+                  | "Sup_Arrows_C"
+                  | "Sup_Math_Operators"
+                  | "Sup_PUA_A"
+                  | "Sup_PUA_B"
+                  | "Sup_Punctuation"
+                  | "Sup_Symbols_And_Pictographs"
+                  | "Super_And_Sub"
+                  | "Sutton_SignWriting"
+                  | "Syloti_Nagri"
+                  | "Symbols_And_Pictographs_Ext_A"
+                  | "Symbols_For_Legacy_Computing"
+                  | "Symbols_For_Legacy_Computing_Sup"
+                  | "Syriac"
+                  | "Syriac_Sup"
+                  | "Tagalog"
+                  | "Tagbanwa"
+                  | "Tags"
+                  | "Tai_Le"
+                  | "Tai_Tham"
+                  | "Tai_Viet"
+                  | "Tai_Xuan_Jing"
+                  | "Takri"
+                  | "Tamil"
+                  | "Tamil_Sup"
+                  | "Tangsa"
+                  | "Tangut"
+                  | "Tangut_Components"
+                  | "Tangut_Sup"
+                  | "Telugu"
+                  | "Thaana"
+                  | "Thai"
+                  | "Tibetan"
+                  | "Tifinagh"
+                  | "Tirhuta"
+                  | "Todhri"
+                  | "Toto"
+                  | "Transport_And_Map"
+                  | "Tulu_Tigalari"
+                  | "UCAS"
+                  | "UCAS_Ext"
+                  | "UCAS_Ext_A"
+                  | "Ugaritic"
+                  | "Vai"
+                  | "Vedic_Ext"
+                  | "Vertical_Forms"
+                  | "Vithkuqi"
+                  | "VS"
+                  | "VS_Sup"
+                  | "Wancho"
+                  | "Warang_Citi"
+                  | "Yezidi"
+                  | "Yi_Radicals"
+                  | "Yi_Syllables"
+                  | "Yijing"
+                  | "Zanabazar_Square"
+                  | "Znamenny_Music"
+                  }?
+
+  code-point-attributes &=
+    attribute gc { "Cc" | "Cf" | "Cn" | "Co" | "Cs"
+                 | "Ll" | "Lm" | "Lo" | "Lt" | "Lu"
+                 | "Mc" | "Me" | "Mn"
+                 | "Nd" | "Nl" | "No"
+                 | "Pc" | "Pd" | "Pe" | "Pf" | "Pi" | "Po" | "Ps"
+                 | "Sc" | "Sk" | "Sm" | "So"
+                 | "Zl" | "Zp" | "Zs"
+                 }?
+
+  code-point-attributes &=
+    attribute ccc { xsd:integer { minInclusive="0" maxInclusive="254" } }?
+
+  code-point-attributes &=
+    attribute bc { "AL" | "AN"
+                 | "B" | "BN"
+                 | "CS"
+                 | "EN" | "ES" | "ET"
+                 | "FSI"
+                 | "L" | "LRE" | "LRI" | "LRO"
+                 | "NSM"
+                 | "ON"
+                 | "PDF" | "PDI"
+                 | "R" | "RLE" | "RLI" | "RLO"
+                 | "S"
+                 | "WS"
+                 }?
+
+  code-point-attributes &=
+    attribute Bidi_M { boolean }?
+
+  code-point-attributes &=
+    attribute bmg { "" | single-code-point }?
+
+  code-point-attributes &=
+    attribute Bidi_C { boolean }?
+
+  code-point-attributes &=
+    attribute bpt { "o" | "c" | "n" }?
+
+  code-point-attributes &=
+    attribute bpb { "#" | single-code-point }?
+
+  code-point-attributes &=
+    attribute dt { "can" | "com" | "enc" | "fin" | "font" | "fra"
+                 | "init" | "iso" | "med" | "nar" | "nb" | "sml"
+                 | "sqr" | "sub" | "sup" | "vert" | "wide" | "none"
+                 }?
+
+  code-point-attributes &=
+    attribute dm { "#" | zero-or-more-code-points }?
+
+  code-point-attributes &=
+    attribute CE { boolean }?
+
+  code-point-attributes &=
+    attribute Comp_Ex { boolean }?
+
+  code-point-attributes &=
+    attribute NFC_QC { "Y" | "N" | "M" }?
+
+  code-point-attributes &=
+    attribute NFD_QC { "Y" | "N" }?
+
+  code-point-attributes &=
+    attribute NFKC_QC { "Y" | "N" | "M" }?
+
+  code-point-attributes &=
+    attribute NFKD_QC { "Y" | "N" }?
+
+
+  code-point-attributes &=
+    attribute XO_NFC { boolean }?
+
+  code-point-attributes &=
+    attribute XO_NFD { boolean }?
+
+  code-point-attributes &=
+    attribute XO_NFKC { boolean }?
+
+  code-point-attributes &=
+    attribute XO_NFKD { boolean }?
+
+
+  code-point-attributes &=
+    attribute FC_NFKC { "#" | one-or-more-code-points }?
+
+  code-point-attributes &=
+    attribute nt { "De" | "Di" | "Nu" | "None" }?
+
+  code-point-attributes &=
+    attribute nv { "NaN" | xsd:string { pattern="-?[0-9]+(/[0-9]+)?" } }?
+
+  code-point-attributes &=
+    attribute jt { "C" | "D" | "L" | "R" | "T" | "U" }?
+
+  code-point-attributes &=
+    attribute jg { "African_Feh" | "African_Noon" | "African_Qaf"
+                 | "Ain" | "Alaph" | "Alef"
+                 | "Beh" | "Beth" | "Burushaski_Yeh_Barree"
+                 | "Dal" | "Dalath_Rish"
+                 | "E"
+                 | "Farsi_Yeh" | "Fe" | "Feh" | "Final_Semkath"
+                 | "Gaf" | "Gamal"
+                 | "Hah" | "Hanifi_Rohingya_Kinna_Ya"
+                 | "Hanifi_Rohingya_Pa" | "He" | "Heh" | "Heh_Goal"
+                 | "Heth"
+                 | "Kaf" | "Kaph" | "Kashmiri_Yeh" | "Khaph"
+                 | "Knotted_Heh"
+                 | "Lam" | "Lamadh"
+                 | "Malayalam_Bha" | "Malayalam_Ja" | "Malayalam_Lla"
+                 | "Malayalam_Llla" | "Malayalam_Nga"
+                 | "Malayalam_Nna" | "Malayalam_Nnna"
+                 | "Malayalam_Nya" | "Malayalam_Ra" | "Malayalam_Ssa"
+                 | "Malayalam_Tta" | "Manichaean_Aleph"
+                 | "Manichaean_Ayin" | "Manichaean_Beth"
+                 | "Manichaean_Daleth" | "Manichaean_Dhamedh"
+                 | "Manichaean_Five" | "Manichaean_Gimel"
+                 | "Manichaean_Heth" | "Manichaean_Hundred"
+                 | "Manichaean_Kaph" | "Manichaean_Lamedh"
+                 | "Manichaean_Mem" | "Manichaean_Nun"
+                 | "Manichaean_One" | "Manichaean_Pe"
+                 | "Manichaean_Qoph" | "Manichaean_Resh"
+                 | "Manichaean_Sadhe" | "Manichaean_Samekh"
+                 | "Manichaean_Taw" | "Manichaean_Ten"
+                 | "Manichaean_Teth" | "Manichaean_Thamedh"
+                 | "Manichaean_Twenty" | "Manichaean_Waw"
+                 | "Manichaean_Yodh" | "Manichaean_Zayin" | "Meem"
+                 | "Mim"
+                 | "No_Joining_Group" | "Noon" | "Nun" | "Nya"
+                 | "Pe"
+                 | "Qaf" | "Qaph"
+                 | "Reh" | "Reversed_Pe" | "Rohingya_Yeh"
+                 | "Sad" | "Sadhe" | "Seen" | "Semkath" | "Shin"
+                 | "Straight_Waw" | "Swash_Kaf" | "Syriac_Waw"
+                 | "Tah" | "Taw" | "Teh_Marbuta" | "Teh_Marbuta_Goal"
+                 | "Teth" | "Thin_Yeh"
+                 | "Vertical_Tail"
+                 | "Waw"
+                 | "Yeh" | "Yeh_Barree" | "Yeh_With_Tail" | "Yudh"
+                 | "Yudh_He"
+                 | "Zain" | "Zhain"
+                 }?
+
+  code-point-attributes &=
+    attribute Join_C { boolean }?
+
+  code-point-attributes &=
+    attribute lb { "AI" | "AK" | "AL" | "AP" | "AS"
+                 | "B2" | "BA" | "BB" | "BK"
+                 | "CB" | "CJ" | "CL" | "CM" | "CP" | "CR"
+                 | "EB" | "EM" | "EX"
+                 | "GL"
+                 | "H2" | "H3" | "HL" | "HY"
+                 | "ID" | "IN" | "IS"
+                 | "JL" | "JT" | "JV"
+                 | "LF"
+                 | "NL" | "NS" | "NU"
+                 | "OP"
+                 | "PO" | "PR"
+                 | "QU"
+                 | "RI"
+                 | "SA" | "SG" | "SP" | "SY"
+                 | "VF" | "VI"
+                 | "WJ"
+                 | "XX"
+                 | "ZW" | "ZWJ"
+                 }?
+
+  code-point-attributes &=
+    attribute ea { "A" | "F" | "H" | "N" | "Na" | "W" }?
+
+  code-point-attributes &=
+    attribute Upper { boolean }?
+
+  code-point-attributes &=
+    attribute Lower { boolean }?
+
+  code-point-attributes &=
+    attribute OUpper { boolean }?
+
+  code-point-attributes &=
+    attribute OLower { boolean }?
+
+  code-point-attributes &=
+    attribute suc { "#" | single-code-point }?
+
+  code-point-attributes &=
+    attribute slc { "#" | single-code-point }?
+
+  code-point-attributes &=
+    attribute stc { "#" | single-code-point }?
+
+  code-point-attributes &=
+    attribute uc { "#" | one-or-more-code-points }?
+
+  code-point-attributes &=
+    attribute lc { "#" | one-or-more-code-points }?
+
+  code-point-attributes &=
+    attribute tc { "#" | one-or-more-code-points }?
+
+  code-point-attributes &=
+    attribute scf { "#" | single-code-point }?
+
+  code-point-attributes &=
+    attribute cf { "#" | one-or-more-code-points }?
+
+  code-point-attributes &=
+    attribute CI { boolean }?
+
+  code-point-attributes &=
+    attribute Cased { boolean }?
+
+  code-point-attributes &=
+    attribute CWCF { boolean }?
+
+  code-point-attributes &=
+    attribute CWCM { boolean }?
+
+  code-point-attributes &=
+    attribute CWL { boolean }?
+
+  code-point-attributes &=
+    attribute CWKCF { boolean }?
+
+  code-point-attributes &=
+    attribute CWT { boolean }?
+
+  code-point-attributes &=
+    attribute CWU { boolean }?
+
+  code-point-attributes &=
+    attribute NFKC_CF { "#" | zero-or-more-code-points }?
+
+  code-point-attributes &=
+    attribute NFKC_SCF { "#" | zero-or-more-code-points }?
+
+  script = "Adlm" | "Aghb" | "Ahom" | "Arab" | "Armi" | "Armn"  # four-letter script codes; shared by the sc and scx attributes below
+           | "Avst"
+           | "Bali" | "Bamu" | "Bass" | "Batk" | "Beng" | "Bhks"
+           | "Bopo" | "Brah" | "Brai" | "Bugi" | "Buhd"
+           | "Cakm" | "Cans" | "Cari" | "Cham" | "Cher" | "Chrs"
+           | "Copt" | "Cpmn" | "Cprt" | "Cyrl"
+           | "Deva" | "Diak" | "Dogr" | "Dsrt" | "Dupl"
+           | "Egyp" | "Elba" | "Elym" | "Ethi"
+           | "Gara" | "Geor" | "Glag" | "Gong" | "Gonm" | "Goth"
+           | "Gran" | "Grek" | "Gujr" | "Gukh" | "Guru"
+           | "Hang" | "Hani" | "Hano" | "Hatr" | "Hebr" | "Hira"
+           | "Hluw" | "Hmng" | "Hmnp" | "Hrkt" | "Hung"
+           | "Ital"
+           | "Java"
+           | "Kali" | "Kana" | "Kawi" | "Khar" | "Khmr" | "Khoj"
+           | "Kits" | "Knda" | "Krai" | "Kthi"
+           | "Lana" | "Laoo" | "Latn" | "Lepc" | "Limb" | "Lina"
+           | "Linb" | "Lisu" | "Lyci" | "Lydi"
+           | "Mahj" | "Maka" | "Mand" | "Mani" | "Marc" | "Medf"
+           | "Mend" | "Merc" | "Mero" | "Mlym" | "Modi" | "Mong"
+           | "Mroo" | "Mtei" | "Mult" | "Mymr"
+           | "Nagm" | "Nand" | "Narb" | "Nbat" | "Newa" | "Nkoo"
+           | "Nshu"
+           | "Ogam" | "Olck" | "Onao" | "Orkh" | "Orya" | "Osge"
+           | "Osma" | "Ougr"
+           | "Palm" | "Pauc" | "Perm" | "Phag" | "Phli" | "Phlp"
+           | "Phnx" | "Plrd" | "Prti"
+           | "Rjng" | "Rohg" | "Runr"
+           | "Samr" | "Sarb" | "Saur" | "Sgnw" | "Shaw" | "Shrd"
+           | "Sidd" | "Sind" | "Sinh" | "Sogd" | "Sogo" | "Sora"
+           | "Soyo" | "Sund" | "Sunu" | "Sylo" | "Syrc"
+           | "Tagb" | "Takr" | "Tale" | "Talu" | "Taml" | "Tang"
+           | "Tavt" | "Telu" | "Tfng" | "Tglg" | "Thaa" | "Thai"
+           | "Tibt" | "Tirh" | "Tnsa" | "Todr" | "Toto" | "Tutg"
+           | "Ugar"
+           | "Vaii" | "Vith"
+           | "Wara" | "Wcho"
+           | "Xpeo" | "Xsux"
+           | "Yezi" | "Yiii"
+           | "Zanb" | "Zinh" | "Zyyy" | "Zzzz"  # the Z* codes close the enumeration
+
+  code-point-attributes &=
+    attribute sc { script }?
+
+  code-point-attributes &=
+    attribute scx { list { script + } }?
+
+  code-point-attributes &=
+    attribute isc { text }?
+
+  code-point-attributes &=
+    attribute hst { "L" | "LV" | "LVT" | "NA" | "T" | "V" }?
+
+  code-point-attributes &=
+    attribute JSN { xsd:string { pattern="[A-Z]{0,3}" } }?
+
+  code-point-attributes &=
+    attribute InSC { "Avagraha"
+                   | "Bindu"
+                   | "Brahmi_Joining_Number"
+                   | "Cantillation_Mark"
+                   | "Consonant"
+                   | "Consonant_Dead"
+                   | "Consonant_Final"
+                   | "Consonant_Head_Letter"
+                   | "Consonant_Initial_Postfixed"
+                   | "Consonant_Killer"
+                   | "Consonant_Medial"
+                   | "Consonant_Placeholder"
+                   | "Consonant_Preceding_Repha"
+                   | "Consonant_Prefixed"
+                   | "Consonant_Subjoined"
+                   | "Consonant_Succeeding_Repha"
+                   | "Consonant_With_Stacker"
+                   | "Gemination_Mark"
+                   | "Invisible_Stacker"
+                   | "Joiner"
+                   | "Modifying_Letter"
+                   | "Non_Joiner"
+                   | "Nukta"
+                   | "Number"
+                   | "Number_Joiner"
+                   | "Other"
+                   | "Pure_Killer"
+                   | "Register_Shifter"
+                   | "Reordering_Killer"
+                   | "Syllable_Modifier"
+                   | "Tone_Letter"
+                   | "Tone_Mark"
+                   | "Virama"
+                   | "Visarga"
+                   | "Vowel"
+                   | "Vowel_Dependent"
+                   | "Vowel_Independent"
+                   }?
+
+  code-point-attributes &=
+    attribute InPC { "Bottom"
+                   | "Bottom_And_Left"
+                   | "Bottom_And_Right"
+                   | "Left"
+                   | "Left_And_Right"
+                   | "NA"
+                   | "Overstruck"
+                   | "Right"
+                   | "Top"
+                   | "Top_And_Bottom"
+                   | "Top_And_Bottom_And_Left"
+                   | "Top_And_Bottom_And_Right"
+                   | "Top_And_Left"
+                   | "Top_And_Left_And_Right"
+                   | "Top_And_Right"
+                   | "Visual_Order_Left"
+                   }?
+
+  code-point-attributes &=
+    attribute InCB { "Consonant"
+                   | "Extend"
+                   | "Linker"
+                   | "None"
+                   }?
+
+  code-point-attributes &=
+    attribute IDS { boolean }?
+
+  code-point-attributes &=
+    attribute OIDS { boolean }?
+
+  code-point-attributes &=
+    attribute XIDS { boolean }?
+
+  code-point-attributes &=
+    attribute IDC { boolean }?
+
+  code-point-attributes &=
+    attribute OIDC { boolean }?
+
+  code-point-attributes &=
+    attribute XIDC { boolean }?
+
+  code-point-attributes &=
+    attribute ID_Compat_Math_Start { boolean }?
+
+  code-point-attributes &=
+    attribute ID_Compat_Math_Continue { boolean }?
+
+  code-point-attributes &=
+    attribute Pat_Syn { boolean }?
+
+  code-point-attributes &=
+    attribute Pat_WS { boolean }?
+
+  code-point-attributes &=
+    attribute Dash { boolean }?
+
+  code-point-attributes &=
+    attribute Hyphen { boolean }?
+
+  code-point-attributes &=
+    attribute QMark { boolean }?
+
+  code-point-attributes &=
+    attribute Term { boolean }?
+
+  code-point-attributes &=
+    attribute STerm { boolean }?
+
+  code-point-attributes &=
+    attribute Dia { boolean }?
+
+  code-point-attributes &=
+    attribute Ext { boolean }?
+
+  code-point-attributes &=
+    attribute SD { boolean }?
+
+  code-point-attributes &=
+    attribute Alpha { boolean }?
+
+  code-point-attributes &=
+    attribute OAlpha { boolean }?
+
+  code-point-attributes &=
+    attribute Math { boolean }?
+
+  code-point-attributes &=
+    attribute OMath { boolean }?
+
+  code-point-attributes &=
+    attribute Hex { boolean }?
+
+  code-point-attributes &=
+    attribute AHex { boolean }?
+
+  code-point-attributes &=
+    attribute DI { boolean }?
+
+  code-point-attributes &=
+    attribute ODI { boolean }?
+
+  code-point-attributes &=
+    attribute LOE { boolean }?
+
+  code-point-attributes &=
+    attribute PCM { boolean }?
+
+  code-point-attributes &=
+    attribute MCM { boolean }?
+
+  code-point-attributes &=
+    attribute WSpace { boolean }?
+
+  code-point-attributes &=
+    attribute vo { "R" | "Tr" | "Tu" | "U" }?
+
+  code-point-attributes &=
+    attribute RI { boolean }?
+
+  code-point-attributes &=
+    attribute Gr_Base { boolean }?
+
+  code-point-attributes &=
+    attribute Gr_Ext { boolean }?
+
+  code-point-attributes &=
+    attribute OGr_Ext { boolean }?
+
+  code-point-attributes &=
+    attribute Gr_Link { boolean }?
+
+  code-point-attributes &=
+    attribute GCB { "CN" | "CR"
+                  | "EB" | "EBG" | "EM" | "EX"
+                  | "GAZ"
+                  | "L" | "LF" | "LV" | "LVT"
+                  | "PP"
+                  | "RI"
+                  | "SM"
+                  | "T"
+                  | "V"
+                  | "XX"
+                  | "ZWJ"
+                  }?
+
+  code-point-attributes &=
+    attribute WB { "CR"
+                 | "DQ"
+                 | "EB" | "EBG" | "EM" | "EX" | "Extend"
+                 | "FO"
+                 | "GAZ"
+                 | "HL"
+                 | "KA"
+                 | "LE" | "LF"
+                 | "MB" | "ML" | "MN"
+                 | "NL" | "NU"
+                 | "RI"
+                 | "SQ"
+                 | "WSegSpace"
+                 | "XX"
+                 | "ZWJ"
+                 }?
+
+  code-point-attributes &=
+    attribute SB { "AT"
+                 | "CL" | "CR"
+                 | "EX"
+                 | "FO"
+                 | "LE" | "LF" | "LO"
+                 | "NU"
+                 | "SC" | "SE" | "SP" | "ST"
+                 | "UP"
+                 | "XX"
+                 }?
+
+  code-point-attributes &=
+    attribute Ideo { boolean }?
+
+  code-point-attributes &=
+    attribute UIdeo { boolean }?
+
+  code-point-attributes &=
+    attribute EqUIdeo { single-code-point }?
+
+  code-point-attributes &=
+    attribute IDSB { boolean }?
+
+  code-point-attributes &=
+    attribute IDST { boolean }?
+
+  code-point-attributes &=
+    attribute IDSU { boolean }?
+
+  code-point-attributes &=
+    attribute Radical { boolean }?
+
+  code-point-attributes &=
+    attribute Dep { boolean }?
+
+  code-point-attributes &=
+    attribute VS { boolean }?
+
+  code-point-attributes &=
+    attribute NChar { boolean }?
+
+  code-point-attributes &= attribute kAccountingNumeric
+    { xsd:string { pattern="[0-9]+" } }?
+
+  code-point-attributes &= attribute kAlternateTotalStrokes
+    { list { xsd:string { pattern="(\d+:[BHJKMPSUV]+)|-" }+ } }?
+
+  code-point-attributes &= attribute kBigFive
+    { xsd:string { pattern="[0-9A-F]{4}'?" } }?
+
+  code-point-attributes &= attribute kCangjie
+    { xsd:string { pattern="[A-Z]+" } }?
+
+  code-point-attributes &= attribute kCantonese
+    { list { xsd:string { pattern="[a-z]{1,6}[1-6]" }+ } }?
+
+  code-point-attributes &= attribute kCCCII
+    { list { xsd:string { pattern="[0-9A-F]{6}" }+ } }?
+
+  code-point-attributes &= attribute kCheungBauer
+    { list { xsd:string { pattern="[0-9]{3}/[0-9]{2};[A-Z]*;[a-z1-6\[\]/,]+" }+ } }?
+
+  code-point-attributes &= attribute kCheungBauerIndex
+    { list { xsd:string { pattern="[0-9]{3}\.[01][0-9]" }+ } }?
+
+  code-point-attributes &= attribute kCihaiT
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}\.[0-9]{3}" }+ } }?
+
+  code-point-attributes &= attribute kCNS1986
+    { xsd:string { pattern="[12E]-[0-9A-F]{4}" } }?
+
+  code-point-attributes &= attribute kCNS1992
+    { xsd:string { pattern="[1-9]-[0-9A-F]{4}" } }?
+
+  code-point-attributes &= attribute kCompatibilityVariant
+    { "" | xsd:string { pattern="U\+[23]?[0-9A-F]{4}" } }?
+
+  code-point-attributes &= attribute kCowles
+    { list { xsd:string { pattern="[0-9]{1,4}(\.[0-9]{1,2})?" }+ } }?
+
+  code-point-attributes &= attribute kDaeJaweon
+    { xsd:string { pattern="[0-9]{4}\.[0-9]{2}[01]" } }?
+
+  code-point-attributes &= attribute kDefinition
+    { xsd:string { pattern='[^\t"]+' } }?
+
+  code-point-attributes &= attribute kEACC
+    { xsd:string { pattern="[0-9A-F]{6}" } }?
+
+  code-point-attributes &= attribute kFanqie
+    { list { xsd:string { pattern="[\x{3400}-\x{4DBF}\x{4E00}-\x{9FFF}\x{20000}-\x{2A6DF}]{2}" }+ } }?
+
+  code-point-attributes &= attribute kFenn
+    { list { xsd:string { pattern="[0-9]+a?[A-KP*]" }+ } }?
+
+  code-point-attributes &= attribute kFennIndex
+    { list { xsd:string { pattern="[0-9][0-9]{0,2}\.[01][0-9]" }+ } }?
+
+  code-point-attributes &= attribute kFourCornerCode
+    { list { xsd:string { pattern="[0-9]{4}(\.[0-9])?" }+ } }?
+
+  code-point-attributes &= attribute kGB0
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &= attribute kGB1
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &= attribute kGB3
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &= attribute kGB5
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &= attribute kGB7
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &= attribute kGB8
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &= attribute kGradeLevel
+    { xsd:string { pattern="[1-6]" } }?
+
+  code-point-attributes &= attribute kGSR
+    { list { xsd:string { pattern="[0-9]{4}[a-vx-z]'?" }+ } }?
+
+  code-point-attributes &= attribute kHangul
+    { list { xsd:string { pattern="[\x{1100}-\x{1112}][\x{1161}-\x{1175}][\x{11A8}-\x{11C2}]?:[01ENX]{1,3}" }+ } }?
+
+  code-point-attributes &= attribute kHanYu
+    { list { xsd:string { pattern="[1-8][0-9]{4}\.[0-3][0-9][0-3]" }+ } }?
+
+  code-point-attributes &= attribute kHanyuPinlu
+    { list { xsd:string { pattern="[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+\([0-9]+\)" }+ } }?
+
+  code-point-attributes &= attribute kHanyuPinyin
+    { list { xsd:string { pattern="(\d{5}\.\d{2}0,)*\d{5}\.\d{2}0:([a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+,)*[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &= attribute kHDZRadBreak
+    { xsd:string { pattern="[\x{2F00}-\x{2FD5}]\[U\+2F[0-9A-D][0-9A-F]\]:[1-8][0-9]{4}\.[0-3][0-9]0" } }?
+
+  code-point-attributes &= attribute kHKGlyph
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &= attribute kIBMJapan
+    { list { xsd:string { pattern="F[ABC][0-9A-F]{2}" }+ } }?
+
+  code-point-attributes &= attribute kIICore
+    { list { xsd:string { pattern="[ABC][GHJKMPT]{1,7}" }+ } }?
+
+  code-point-attributes &= attribute kIRG_GSource
+    { "" | xsd:string { pattern="G[013578EKS]-[0-9A-F]{4}" }
+         | xsd:string { pattern="G4K(-\d{5})?" }
+         | xsd:string { pattern="G(DZ|GH|RM|WZ|XC|XH|ZH)-\d{4}\.\d{2}" }
+         | xsd:string { pattern="G(BK|CH|CY|HC)(-\d{4}\.\d{2})?" }
+         | xsd:string { pattern="GKX-\d{4}\.\d{2,3}" }
+         | xsd:string { pattern="G(HZ|HZR)-\d{5}\.\d{2}" }
+         | xsd:string { pattern="G(CE|FC|IDC23|OCD|XHZ)-\d{3}" }
+         | xsd:string { pattern="G(H|HF|LGYJ|PGLG|T)-\d{4}" }
+         | xsd:string { pattern="G(CYY|DM|JZ|KJ|XM|ZFY|ZJW|ZYS)-\d{5}" }
+         | xsd:string { pattern="G(FZ|IDC)-[0-9A-F]{4}" }
+         | xsd:string { pattern="GGFZ-\d{6}" }
+         | xsd:string { pattern="G(LK|Z)-\d{7}" }
+         | xsd:string { pattern="GU-[023][0-9A-F]{4}" }
+         | xsd:string { pattern="GZA-[123467]\d{5}" }
+    }?
+
+  code-point-attributes &= attribute kIRG_HSource
+    { "" | xsd:string { pattern="H-[0-9A-F]{4}" }
+         | xsd:string { pattern="H(B[012])-[0-9A-F]{4}" }
+         | xsd:string { pattern="HD-[23]?[0-9A-F]{4}" }
+         | xsd:string { pattern="HU-[023][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &= attribute kIRG_JSource
+    { "" | xsd:string { pattern="J[014]-[0-9A-F]{4}" }
+         | xsd:string { pattern="J3A?-[0-9A-F]{4}" }
+         | xsd:string { pattern="J13A?-[0-9A-F]{4}" }
+         | xsd:string { pattern="J14-[0-9A-F]{4}" }
+         | xsd:string { pattern="JA[34]?-[0-9A-F]{4}" }
+         | xsd:string { pattern="JARIB-[0-9A-F]{4}" }
+         | xsd:string { pattern="JH-(JT[ABC][0-9A-F]{3}S?|IB\d{4}|\d{6})" }
+         | xsd:string { pattern="JK-\d{5}" }
+         | xsd:string { pattern="JMJ-\d{6}" }
+    }?
+
+  code-point-attributes &= attribute kIRG_KPSource
+    { "" | xsd:string { pattern="KP([01]-[0-9A-F]{4}|U-[023][0-9A-F]{4})" } }?
+
+  code-point-attributes &= attribute kIRG_KSource
+    { "" | xsd:string { pattern="K[0-6]-[0-9A-F]{4}" }
+         | xsd:string { pattern="KC-\d{5}" }
+         | xsd:string { pattern="KU-[023][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &= attribute kIRG_MSource
+    { "" | xsd:string { pattern="MA-[0-9A-F]{4}" }
+         | xsd:string { pattern="MB[12]-[0-9A-F]{4}" }
+         | xsd:string { pattern="MC-\d{5}" }
+         | xsd:string { pattern="MDH?-[23]?[0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &= attribute kIRG_SSource
+    { "" | xsd:string { pattern="SAT-\d{5}" } }?
+
+  code-point-attributes &= attribute kIRG_TSource
+    { "" | xsd:string { pattern="T([1-7A-F]|1[1-3])-[0-9A-F]{4}" }
+         | xsd:string { pattern="TU-[023][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &= attribute kIRG_UKSource
+    { "" | xsd:string { pattern="UK-\d{5}" } }?
+
+  code-point-attributes &= attribute kIRG_USource
+    { "" | xsd:string { pattern="UTC-\d{5}" } }?
+
+  code-point-attributes &= attribute kIRG_VSource
+    { "" | xsd:string { pattern="V[0-4]-[0-9A-F]{4}" }
+         | xsd:string { pattern="VN-[023F][0-9A-F]{4}" }
+    }?
+
+  code-point-attributes &= attribute kIRGDaeJaweon
+    { list { xsd:string { pattern="[0-9]{4}\.[0-9]{2}[01]" }+ } }?
+
+  code-point-attributes &= attribute kIRGHanyuDaZidian
+    { list { xsd:string { pattern="[1-8][0-9]{4}\.[0-3][0-9][01]" }+ } }?
+
+  code-point-attributes &= attribute kIRGKangXi
+    { list { xsd:string { pattern="[01][0-9]{3}\.[0-7][0-9][01]" }+ } }?
+
+  code-point-attributes &= attribute kJa
+    { list { xsd:string { pattern="[0-9A-F]{4}S?" }+ } }?
+
+  code-point-attributes &= attribute kJapanese
+    { list { xsd:string { pattern="[\x{3041}-\x{3096}\x{3099}\x{309A}\x{30A1}-\x{30FA}\x{30FC}]+" }+ } }?
+
+  code-point-attributes &= attribute kJapaneseKun
+    { list { xsd:string { pattern="[A-Z]+" }+ } }?
+
+  code-point-attributes &= attribute kJapaneseOn
+    { list { xsd:string { pattern="[A-Z]+" }+ } }?
+
+  code-point-attributes &= attribute kJinmeiyoKanji
+    { list { xsd:string { pattern="(20[0-9]{2})(:U\+[23]?[0-9A-F]{4})?" }+ } }?
+
+  code-point-attributes &= attribute kJis0
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &= attribute kJis1
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &= attribute kJIS0213
+    { list { xsd:string { pattern="[12],[0-9]{2},[0-9]{1,2}" }+ } }?
+
+  code-point-attributes &= attribute kJoyoKanji
+    { list { xsd:string { pattern="(20[0-9]{2})|(U\+[23]?[0-9A-F]{4})" }+ } }?
+
+  code-point-attributes &= attribute kKangXi
+    { list { xsd:string { pattern="[0-9]{4}\.[0-9]{2}[01]" }+ } }?
+
+  code-point-attributes &= attribute kKarlgren
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}[A*]?" }+ } }?
+
+  code-point-attributes &= attribute kKorean
+    { list { xsd:string { pattern="[A-Z]+" }+ } }?
+
+  code-point-attributes &= attribute kKoreanEducationHanja
+    { list { xsd:string { pattern="20[0-9]{2}" }+ } }?
+
+  code-point-attributes &= attribute kKoreanName
+    { list { xsd:string { pattern="20[0-9]{2}" }+ } }?
+
+  code-point-attributes &= attribute kLau
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}" }+ } }?
+
+  code-point-attributes &= attribute kMainlandTelegraph
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &= attribute kMandarin
+    { list { xsd:string { pattern="[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &= attribute kMatthews
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}(a|\.5)?" }+ } }?
+
+  code-point-attributes &= attribute kMeyerWempe
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}[a-t*]?" }+ } }?
+
+  code-point-attributes &= attribute kMojiJoho
+    { list { xsd:string { pattern="MJ\d{6}(:(FE0[01]|E01[01][0-9A-F]))?" }+ } }?
+
+  code-point-attributes &= attribute kMorohashi
+    { list { xsd:string { pattern="(\d{5}'{0,2}|H\d{3})(:(FE0[01]|E010[0-9A-F]))?" }+ } }?
+
+  code-point-attributes &= attribute kNelson
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &= attribute kOtherNumeric
+    { list { xsd:string { pattern="[0-9]+" }+ } }?
+
+  code-point-attributes &= attribute kPhonetic
+    { list { xsd:string { pattern="[1-9][0-9]{0,3}[A-D]?\*?" }+ } }?
+
+  code-point-attributes &= attribute kPrimaryNumeric
+    { list { xsd:string { pattern="[0-9]+" }+ } }?
+
+  code-point-attributes &= attribute kPseudoGB1
+    { xsd:string { pattern="[0-9]{4}" } }?
+
+  code-point-attributes &= attribute kRSAdobe_Japan1_6
+    { list { xsd:string { pattern="[CV]\+[0-9]{1,5}\+[1-9][0-9]{0,2}\.[1-9][0-9]?\.[0-9]{1,2}" }+ } }?
+
+  code-point-attributes &= attribute kRSUnicode
+    { list { xsd:string { pattern="[1-9][0-9]{0,2}'{0,3}\.-?[0-9]{1,2}" }+ } }?
+
+  code-point-attributes &= attribute kSBGY
+    { list { xsd:string { pattern="[0-9]{3}\.[0-7][0-9]" }+ } }?
+
+  code-point-attributes &= attribute kSemanticVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}(<[ks][A-Za-z0-9_]+(:[TBZFJ]+)?(,[ks][A-Za-z0-9_]+(:[TBZFJ]+)?)*)?" }+ } }?
+
+  code-point-attributes &= attribute kSimplifiedVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}" }+ } }?
+
+  code-point-attributes &= attribute kSMSZD2003Index
+    { list { xsd:string { pattern="\d{1,3}\.\d{2}" }+ } }?
+
+  code-point-attributes &= attribute kSMSZD2003Readings
+    { list { xsd:string { pattern="[a-z\x{300}\x{301}\x{302}\x{304}\x{308}\x{30C}]+(,[a-z\x{300}\x{301}\x{302}\x{304}\x{308}\x{30C}]+)*\x{7CB5}[a-z]+[1-6]([a-z]+[1-6])?(,[a-z]+[1-6]([a-z]+[1-6])?)*" }+ } }?
+
+  code-point-attributes &= attribute kSpecializedSemanticVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}(<[ks][A-Za-z0-9_]+(:[TBZFJ]+)?(,[ks][A-Za-z0-9_]+(:[TBZFJ]+)?)*)?" }+ } }?
+
+  code-point-attributes &= attribute kSpoofingVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}" }+ } }?
+
+  code-point-attributes &= attribute kStrange
+    { list { ( xsd:string { pattern="[ACU]" }
+             | xsd:string { pattern="B:U\+31[0-2AB][0-9A-F]" }
+             | xsd:string { pattern="[FMOR](:U\+[23]?[0-9A-F]{4})?" }
+             | xsd:string { pattern="H:U\+31[3-8][0-9A-F]" }
+             | xsd:string { pattern="I(:U\+[23]?[0-9A-F]{4})*" }
+             | xsd:string { pattern="K(:U\+30[A-F][0-9A-F])+" }
+             | xsd:string { pattern="S:[4-9][0-9]" }
+    )+}}?
+
+  code-point-attributes &= attribute kTaiwanTelegraph
+    { list { xsd:string { pattern="[0-9]{4}" }+ } }?
+
+  code-point-attributes &= attribute kTang
+    { list { xsd:string { pattern="\*?[A-Za-z()\x{E6}\x{251}\x{259}\x{25B}\x{300}\x{30C}]+" }+ } }?
+
+  code-point-attributes &= attribute kTGH
+    { list { xsd:string { pattern="20[0-9]{2}:[1-9][0-9]{0,3}" }+ } }?
+
+  code-point-attributes &= attribute kTGHZ2013
+    { list { xsd:string { pattern="[0-9]{3}\.[0-9]{3}(,[0-9]{3}\.[0-9]{3})*:[a-z\x{300}-\x{302}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &= attribute kTotalStrokes
+    { list { xsd:string { pattern="[1-9][0-9]{0,2}" }+ } }?
+
+  code-point-attributes &= attribute kTraditionalVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}" }+ } }?
+
+  code-point-attributes &= attribute kUnihanCore2020
+    { xsd:string { pattern="[GHJKMPT]{1,7}" } }?
+
+  code-point-attributes &= attribute kVietnamese
+    { list { xsd:string { pattern="[A-Za-z\x{110}\x{111}\x{300}-\x{303}\x{306}\x{309}\x{31B}\x{323}]+" }+ } }?
+
+  code-point-attributes &= attribute kVietnameseNumeric
+    { list { xsd:string { pattern="\d+" }+ } }?
+
+  code-point-attributes &= attribute kXerox
+    { list { xsd:string { pattern="[0-9]{3}:[0-9]{3}" }+ } }?
+
+  code-point-attributes &= attribute kXHC1983
+    { list { xsd:string { pattern="[0-9]{4}\.[0-9]{3}\*?(,[0-9]{4}\.[0-9]{3}\*?)*:[a-z\x{300}\x{301}\x{304}\x{308}\x{30C}]+" }+ } }?
+
+  code-point-attributes &= attribute kZhuang
+    { list { xsd:string { pattern="[a-z]+\*?" }+ } }?
+
+  code-point-attributes &= attribute kZhuangNumeric
+    { list { xsd:string { pattern="\d+" }+ } }?
+
+  code-point-attributes &= attribute kZVariant
+    { list { xsd:string { pattern="U\+[23]?[0-9A-F]{4}(<[ks][A-Za-z0-9_]+(:[TBZ]+)?(,[ks][A-Za-z0-9_]+(:[TBZ]+)?)*)?" }+ } }?
+
+  # kRSTUnicode (optional): digits, ".", digits. kTGT_MergedSrc (optional): exactly one of the source-prefixed identifier patterns below.
+  code-point-attributes &=
+    attribute kRSTUnicode { xsd:string { pattern="[0-9]+\.[0-9]+" } }?
+
+  code-point-attributes &=
+    attribute kTGT_MergedSrc 
+     { xsd:string {pattern="L2008-[0-9A-F]{4,5}(-[0-9]{4,5})?"}
+     | xsd:string {pattern="L2006-[0-9]{4}"}
+     | xsd:string {pattern="L1997-[0-9]{4}"}
+     | xsd:string {pattern="L1986-[0-9]{4}"}
+     | xsd:string {pattern="S1968-[0-9]{4}"}
+     | xsd:string {pattern="N1966-[0-9]{3}(-[0-9A-Z]{3,4})?"}
+     | xsd:string {pattern="H2004-[A-Z]-[0-9]{4}"}
+     | xsd:string {pattern="L2012-[0-9]{4}"}
+     | xsd:string {pattern="UTN42-[0-9]{3}"}
+     }?
+
+  # kSrc_NushuDuben (optional): digits, ".", digits. kReading (optional): any string, no pattern constraint.
+  code-point-attributes &=
+    attribute kSrc_NushuDuben { xsd:string { pattern="[0-9]+\.[0-9]+" } }?
+
+  code-point-attributes &=
+    attribute kReading { xsd:string }?
+
+  # Optional <blocks> child of ucd.content: one or more <block> elements, each with first-cp, last-cp and name.
+  ucd.content &=
+    element blocks {
+      element block {
+        attribute first-cp { single-code-point },
+        attribute last-cp { single-code-point },
+        attribute name { text } }+ }?
+
+  # Optional <named-sequences> and <provisional-named-sequences>: both hold one or more <named-sequence> (cps + name).
+  ucd.content &=
+    element named-sequences {
+      element named-sequence {
+        attribute cps { one-or-more-code-points },
+        attribute name { text } }+ }?
+
+  ucd.content &=
+    element provisional-named-sequences {
+      element named-sequence {
+        attribute cps { one-or-more-code-points },
+        attribute name { text } }+ }?
+
+  # Optional <normalization-corrections>: one or more entries giving a code point (cp), its old and new sequences, and a version.
+  ucd.content &=
+    element normalization-corrections {
+      element normalization-correction {
+        attribute cp { single-code-point },
+        attribute old { one-or-more-code-points },
+        attribute new { one-or-more-code-points },
+        attribute version { text } }+ }?
+
+  # Optional <standardized-variants>: one or more entries; cps is exactly two code points, desc and when are free text.
+  ucd.content &=
+    element standardized-variants {
+      element standardized-variant {
+        attribute cps { two-code-points },
+        attribute desc { text },
+        attribute when { text } }+ }?
+
+  # Optional <cjk-radicals>: number is 1-3 digits plus up to three apostrophes; radical may be empty, ideograph is required.
+  ucd.content &=
+    element cjk-radicals {
+      element cjk-radical {
+        attribute number { xsd:string {pattern="[0-9]{1,3}'{0,3}"}},
+        attribute radical { single-code-point? },
+        attribute ideograph { single-code-point } }+ }?
+
+  # Optional <emoji-sources>: maps a Unicode sequence to docomo/kddi/softbank values, each of which may be empty.
+  ucd.content &=
+    element emoji-sources {
+      element emoji-source {
+        attribute unicode { one-or-more-code-points },
+        attribute docomo { jis-code-point? },
+        attribute kddi { jis-code-point? },
+        attribute softbank { jis-code-point? } }+ }?
+
+  # Optional boolean code point attributes: Emoji, EPres, EMod, EBase, EComp, ExtPict.
+  code-point-attributes &=
+    attribute Emoji { boolean }?
+
+  code-point-attributes &=
+    attribute EPres { boolean }?
+
+  code-point-attributes &=
+    attribute EMod { boolean }?
+
+  code-point-attributes &=
+    attribute EBase { boolean }?
+
+  code-point-attributes &=
+    attribute EComp { boolean }?
+
+  code-point-attributes &=
+    attribute ExtPict { boolean }?
+
+  # Optional <do-not-emit>: one or more <instead> entries (of -> use) whose "because" is one of the enumerated reasons.
+  ucd.content &=
+    element do-not-emit {
+      element instead {
+        attribute of { one-or-more-code-points },
+        attribute use { one-or-more-code-points },
+        attribute because { "Bengali_Khanda_Ta"
+                          | "Deprecated"
+                          | "Discouraged"
+                          | "Dotless_Form"
+                          | "Hamza_Form"
+                          | "Indic_Atomic_Consonant"
+                          | "Indic_Consonant_Conjunct"
+                          | "Indic_Vowel_Letter"
+                          | "Malayalam_Chillu"
+                          | "Precomposed_Form"
+                          | "Precomposed_Hieroglyph"
+                          | "Preferred_Spelling"
+                          | "Tamil_Shrii"
+      } }+ }?
+
diff --git a/unicodetools/src/main/resources/org/unicode/uax42/pom.xml b/unicodetools/src/main/resources/org/unicode/uax42/pom.xml
new file mode 100644
index 000000000..9ae81d56f
--- /dev/null
+++ b/unicodetools/src/main/resources/org/unicode/uax42/pom.xml
@@ -0,0 +1,72 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+	<modelVersion>4.0.0</modelVersion>
+
+	<artifactId>uax42</artifactId>
+	<name>Unicode Standard Annex #42</name>
+
+	<!-- Transforms index.xml twice with xml-maven-plugin: index2html.xsl produces the .html file, index2rnc.xsl the .rnc file. -->
+	<parent>
+		<groupId>org.unicode.unicodetools</groupId>
+		<artifactId>unicodetools-parent</artifactId>
+		<version>1.0.0</version>
+	</parent>
+
+	<build>
+		<plugins>
+			<plugin>
+				<groupId>org.codehaus.mojo</groupId>
+				<artifactId>xml-maven-plugin</artifactId>
+				<version>1.1.0</version>
+				<executions>
+					<execution>
+						<goals>
+							<goal>transform</goal>
+						</goals>
+					</execution>
+				</executions>
+				<configuration>
+					<transformationSets>
+						<transformationSet> <!-- index.xml to HTML -->
+							<dir>${project.basedir}</dir>
+							<xincludeAware>true</xincludeAware>
+							<includes>
+								<include>index.xml</include>
+							</includes>
+							<stylesheet>index2html.xsl</stylesheet>
+							<outputDir>${outputdir}</outputDir> <!-- NOTE(review): outputdir is not defined in this POM; presumably passed as -Doutputdir=... (confirm) -->
+							<fileMappers>
+								<fileMapper implementation="org.codehaus.plexus.components.io.filemappers.FileExtensionMapper">
+									<targetExtension>.html</targetExtension>
+								</fileMapper>
+							</fileMappers>
+						</transformationSet>
+						<transformationSet> <!-- index.xml to RELAX NG compact schema; same input and output directory as above -->
+							<dir>${project.basedir}</dir>
+							<xincludeAware>true</xincludeAware>
+							<includes>
+								<include>index.xml</include>
+							</includes>
+							<stylesheet>index2rnc.xsl</stylesheet>
+							<outputDir>${outputdir}</outputDir>
+							<fileMappers>
+								<fileMapper implementation="org.codehaus.plexus.components.io.filemappers.FileExtensionMapper">
+									<targetExtension>.rnc</targetExtension>
+								</fileMapper>
+							</fileMappers>
+						</transformationSet>
+					</transformationSets>
+				</configuration>
+				<dependencies> <!-- plugin-scoped: Saxon-HE is on this plugin's classpath only; presumably used as the XSLT processor (confirm) -->
+					<dependency>
+						<groupId>net.sf.saxon</groupId>
+						<artifactId>Saxon-HE</artifactId>
+						<version>12.4</version>
+					</dependency>
+				</dependencies>
+			</plugin>
+		</plugins>
+	</build>
+
+</project>
diff --git a/unicodetools/src/test/java/org/unicode/unittest/TestLocaleConstruction.java b/unicodetools/src/test/java/org/unicode/unittest/TestLocaleConstruction.java
index eb31c0452..9b6dd4983 100644
--- a/unicodetools/src/test/java/org/unicode/unittest/TestLocaleConstruction.java
+++ b/unicodetools/src/test/java/org/unicode/unittest/TestLocaleConstruction.java
@@ -377,7 +377,8 @@ void buildLocale(Multimap<String, String> args) {
     ////        AliasesFull aliases = new AliasesFull(dataType);
     ////        Output<Collection<ExceptionInfo>> exception = new Output<>();
     ////
-    ////        for (Entry<Datasubtype, ValiditySet> entry : validityInfo.get(dataType).entrySet())
+    ////        for (Entry<Datasubtype, ValiditySet> entry :
+    // validityInfo.get(dataType).entrySet())
     // {
     ////            for (String code : entry.getValue().regularData) {
     ////                String replacement = aliases.getCanonical(
@@ -388,7 +389,8 @@ void buildLocale(Multimap<String, String> args) {
     ////                if (replacement != null) {
     ////                    if (DEBUG) System.out.println(code + " ==> " + replacement);
     ////                } else if (exception.value != null){
-    ////                    if (DEBUG) System.out.println(code + " ==> " + exception.toString());
+    ////                    if (DEBUG) System.out.println(code + " ==> " +
+    // exception.toString());
     ////                }
     ////            }
     ////        }

Version	+ Unicode + + + + +
+ + + Editor + + + Editors + + +	+ +
Date	+ + + + +
This Version	+ + + + +
Previous Version	+ + + n/a + + + + + + + + +
Latest Version	+ +
Latest Proposed Update	+ proposed.html +
Schema	+ + + + +
Revision	+ + + + + + +
Version	Unicode 16.0.0
Editor	John Wilcock
Date	2024-08-15
This Version	https://www.unicode.org/reports/tr42/tr42-36.html
Previous Version	https://www.unicode.org/reports/tr42/tr42-34.html
Latest Version	https://www.unicode.org/reports/tr42/
Latest Proposed Update	https://www.unicode.org/reports/tr42/proposed.html
Schema	https://www.unicode.org/reports/tr42/tr42-36.rnc
Revision	36