示例#1
0
文件: index.cs 项目: reactxx/rewise
    /// <summary>
    /// Runs the build steps listed below in a fixed order, writing each step's
    /// name to the console immediately before the step is invoked.
    /// </summary>
    public static void Build()
    {
        // Prints the step label, then executes the step.
        Action<string, Action> runStep = (label, step) =>
        {
            Console.WriteLine(label);
            step();
        };

        runStep("CldrDesignLib.RefreshCldrDataSource", () => CldrDesignLib.RefreshCldrDataSource());

        runStep("UnicodeDesignLib.getUnicodeBlockNames", () => UnicodeDesignLib.getUnicodeBlockNames());

        runStep("CldrDesignLib.RefreshNetSuportedCultures", () => CldrDesignLib.RefreshNetSuportedCultures());
        runStep("CldrDesignLib.RefreshOldToNew", () => CldrDesignLib.RefreshOldToNew());
        runStep("CldrDesignLib.RefreshTexts", () => CldrDesignLib.RefreshTexts());
        runStep("CldrDesignLib.Build", () => CldrDesignLib.Build());

        runStep("CldrTrans.Build", () => CldrTrans.Build());

        runStep("LangsDesignLib.RefreshOldVersionInfo", () => LangsDesignLib.RefreshOldVersionInfo());
        runStep("LangsDesignLib.MergeOldToCldr", () => LangsDesignLib.MergeOldToCldr());

        runStep("CldrDesignLib.RefreshCldrStatistics", () => CldrDesignLib.RefreshCldrStatistics());

        runStep("CldrDesignLib.BuildDart", () => CldrDesignLib.BuildDart());
        runStep("CldrDesignLib.UnicodeDart", () => CldrDesignLib.UnicodeDart());
    }
示例#2
0
        /// <summary>
        /// Program entry point: runs <c>CldrDesignLib.exportForWikibulary()</c> and exits.
        /// </summary>
        /// <param name="args">Command-line arguments; not used.</param>
        static void Main(string[] args)
        {
            // Everything that used to follow this call sat behind an unconditional
            // `return` and could never execute (compiler warning CS0162). That dead
            // code -- an impersonation block containing a plaintext account password,
            // wrapped around a long list of commented-out experiments -- has been
            // removed. Recover it from source-control history if it is needed again.
            //
            // NOTE(review): the removed password was stored in plaintext in source, so
            // treat it as compromised. If impersonation is reintroduced, load the
            // credentials from outside the source tree instead of hard-coding them.
            CldrDesignLib.exportForWikibulary();
        }