Ejemplo n.º 1
0
        /// <summary>
        /// Reads the Unihan numeric values data file and stores, for every record, the numeric type and
        /// numeric value on the Unihan entry of the corresponding code point.
        /// </summary>
        /// <param name="unihanDataSource">The data source from which the numeric values file is opened.</param>
        /// <param name="builder">The builder providing the Unihan entries to update.</param>
        /// <returns>A task that completes once the whole file has been processed.</returns>
        /// <exception cref="InvalidDataException">A record carries a property other than the three numeric properties handled here.</exception>
        private static async Task ProcessUnihanNumericValues(IDataSource unihanDataSource, UnicodeInfoBuilder builder)
        {
            using (var reader = new UnihanDataFileReader(await unihanDataSource.OpenDataFileAsync(UnihanNumericValuesFileName).ConfigureAwait(false)))
            {
                while (reader.Read())
                {
                    UnihanNumericType numericType;

                    // Validate the property before touching the builder, so that an unknown property aborts without requesting an entry.
                    switch (reader.PropertyName)
                    {
                    case UnihanProperty.AccountingNumeric:
                        numericType = UnihanNumericType.Accounting;
                        break;

                    case UnihanProperty.OtherNumeric:
                        numericType = UnihanNumericType.Other;
                        break;

                    case UnihanProperty.PrimaryNumeric:
                        numericType = UnihanNumericType.Primary;
                        break;

                    default:
                        throw new InvalidDataException("Unrecognized property name: " + reader.PropertyName + ".");
                    }

                    // The data file is machine-readable: parse with the invariant culture so that the result
                    // does not depend on the culture of the thread running the builder.
                    long numericValue = long.Parse(reader.PropertyValue, CultureInfo.InvariantCulture);

                    var entry = builder.GetUnihan(reader.CodePoint);

                    entry.NumericType = numericType;
                    entry.NumericValue = numericValue;
                }
            }
        }
Ejemplo n.º 2
0
        /// <summary>
        /// Reads the Unihan IRG sources data file and adds the radical/stroke counts found in
        /// kRSUnicode records to the Unihan entry of the corresponding code point.
        /// </summary>
        /// <remarks>
        /// A kRSUnicode value is a space-separated list of items. Each item is decoded as a radical number,
        /// followed by either <c>.</c> or <c>'</c> (the apostrophe marks the simplified form), followed by a
        /// stroke count that may carry a leading sign. All other properties of the file are ignored.
        /// </remarks>
        /// <param name="unihanDataSource">The data source from which the IRG sources file is opened.</param>
        /// <param name="builder">The builder providing the Unihan entries to update.</param>
        /// <returns>A task that completes once the whole file has been processed.</returns>
        /// <exception cref="InvalidDataException">An item contains neither <c>.</c> nor <c>'</c>.</exception>
        private static async Task ProcessUnihanIrgSources(IDataSource unihanDataSource, UnicodeInfoBuilder builder)
        {
            using (var reader = new UnihanDataFileReader(await unihanDataSource.OpenDataFileAsync(UnihanIrgSourcesFileName).ConfigureAwait(false)))
            {
                // Either character terminates the radical number.
                var separators = new[] { '\'', '.' };

                while (reader.Read())
                {
                    switch (reader.PropertyName)
                    {
                    case UnihanProperty.RSUnicode:
                        var entry = builder.GetUnihan(reader.CodePoint);

                        foreach (string value in reader.PropertyValue.Split(' '))
                        {
                            int index = value.IndexOfAny(separators);

                            if (index < 0)
                            {
                                throw new InvalidDataException("Failed to decode value for kRSUnicode / Unicode_Radical_Stroke.");
                            }

                            bool isSimplified = value[index] == '\'';

                            // The data file is machine-readable: parse with the invariant culture so that digits and,
                            // above all, the leading sign are interpreted independently of the current thread culture.
                            byte radical = byte.Parse(value.Substring(0, index), NumberStyles.None, CultureInfo.InvariantCulture);

                            // When the apostrophe is present, two characters are skipped; this assumes that a '.' immediately follows it.
                            sbyte strokeCount = sbyte.Parse(value.Substring(index + (isSimplified ? 2 : 1)), NumberStyles.AllowLeadingSign, CultureInfo.InvariantCulture);

                            entry.UnicodeRadicalStrokeCounts.Add(new UnicodeRadicalStrokeCount(radical, strokeCount, isSimplified));
                        }
                        break;

                    default:
                        // Ignore unhandled properties for now.
                        break;
                    }
                }
            }
        }
Ejemplo n.º 3
0
        /// <summary>
        /// Reads the Unihan variants data file and stores the simplified and traditional variants
        /// on the Unihan entry of the corresponding code point.
        /// </summary>
        /// <param name="unihanDataSource">The data source from which the variants file is opened.</param>
        /// <param name="builder">The builder providing the Unihan entries to update.</param>
        /// <returns>A task that completes once the whole file has been processed.</returns>
        private static async Task ProcessUnihanVariants(IDataSource unihanDataSource, UnicodeInfoBuilder builder)
        {
            var dataFile = await unihanDataSource.OpenDataFileAsync(UnihanVariantsFileName).ConfigureAwait(false);

            using (var reader = new UnihanDataFileReader(dataFile))
            {
                while (reader.Read())
                {
                    // The entry is requested inside the handled cases only, so records carrying
                    // any other property never cause an entry to be requested from the builder.
                    switch (reader.PropertyName)
                    {
                    case UnihanProperty.SimplifiedVariant:
                        builder.GetUnihan(reader.CodePoint).SimplifiedVariant = char.ConvertFromUtf32(HexCodePoint.ParsePrefixed(reader.PropertyValue));
                        break;

                    case UnihanProperty.TraditionalVariant:
                        builder.GetUnihan(reader.CodePoint).TraditionalVariant = char.ConvertFromUtf32(HexCodePoint.ParsePrefixed(reader.PropertyValue));
                        break;

                    default:
                        // Ignore unhandled properties for now.
                        break;
                    }
                }
            }
        }
Ejemplo n.º 4
0
        /// <summary>
        /// Reads the Unihan readings data file and stores the definition and the per-language readings
        /// on the Unihan entry of the corresponding code point.
        /// </summary>
        /// <param name="unihanDataSource">The data source from which the readings file is opened.</param>
        /// <param name="builder">The builder providing the Unihan entries to update.</param>
        /// <returns>A task that completes once the whole file has been processed.</returns>
        private static async Task ProcessUnihanReadings(IDataSource unihanDataSource, UnicodeInfoBuilder builder)
        {
            var dataFile = await unihanDataSource.OpenDataFileAsync(UnihanReadingsFileName).ConfigureAwait(false);

            using (var reader = new UnihanDataFileReader(dataFile))
            {
                while (reader.Read())
                {
                    // The entry is requested inside the handled cases only, so it is created
                    // exclusively for records that carry meaningful data.
                    switch (reader.PropertyName)
                    {
                    case UnihanProperty.Definition:
                        builder.GetUnihan(reader.CodePoint).Definition = reader.PropertyValue;
                        break;

                    case UnihanProperty.Mandarin:
                        builder.GetUnihan(reader.CodePoint).MandarinReading = reader.PropertyValue;
                        break;

                    case UnihanProperty.Cantonese:
                        builder.GetUnihan(reader.CodePoint).CantoneseReading = reader.PropertyValue;
                        break;

                    case UnihanProperty.JapaneseKun:
                        builder.GetUnihan(reader.CodePoint).JapaneseKunReading = reader.PropertyValue;
                        break;

                    case UnihanProperty.JapaneseOn:
                        builder.GetUnihan(reader.CodePoint).JapaneseOnReading = reader.PropertyValue;
                        break;

                    case UnihanProperty.Korean:
                        builder.GetUnihan(reader.CodePoint).KoreanReading = reader.PropertyValue;
                        break;

                    case UnihanProperty.Hangul:
                        builder.GetUnihan(reader.CodePoint).HangulReading = reader.PropertyValue;
                        break;

                    case UnihanProperty.Vietnamese:
                        builder.GetUnihan(reader.CodePoint).VietnameseReading = reader.PropertyValue;
                        break;

                    default:
                        // Ignore unhandled properties for now.
                        break;
                    }
                }
            }
        }