/// <summary>
/// Runs the build steps one after another in a fixed order. The qualified name of each
/// step is written to the console immediately before that step is invoked.
/// </summary>
public static void Build() {
    // Announces a step by name, then executes it.
    Action<string, Action> runStep = (label, step) => {
        Console.WriteLine(label);
        step();
    };

    runStep("CldrDesignLib.RefreshCldrDataSource", () => CldrDesignLib.RefreshCldrDataSource());
    runStep("UnicodeDesignLib.getUnicodeBlockNames", () => UnicodeDesignLib.getUnicodeBlockNames());
    runStep("CldrDesignLib.RefreshNetSuportedCultures", () => CldrDesignLib.RefreshNetSuportedCultures());
    runStep("CldrDesignLib.RefreshOldToNew", () => CldrDesignLib.RefreshOldToNew());
    runStep("CldrDesignLib.RefreshTexts", () => CldrDesignLib.RefreshTexts());
    runStep("CldrDesignLib.Build", () => CldrDesignLib.Build());
    runStep("CldrTrans.Build", () => CldrTrans.Build());
    runStep("LangsDesignLib.RefreshOldVersionInfo", () => LangsDesignLib.RefreshOldVersionInfo());
    runStep("LangsDesignLib.MergeOldToCldr", () => LangsDesignLib.MergeOldToCldr());
    runStep("CldrDesignLib.RefreshCldrStatistics", () => CldrDesignLib.RefreshCldrStatistics());
    runStep("CldrDesignLib.BuildDart", () => CldrDesignLib.BuildDart());
    runStep("CldrDesignLib.UnicodeDart", () => CldrDesignLib.UnicodeDart());
}
/// <summary>
/// Entry point of the tool. It currently runs only
/// <c>CldrDesignLib.exportForWikibulary()</c> and then exits.
/// </summary>
/// <remarks>
/// All other one-off tasks are kept, commented out, in <see cref="RunArchivedTasks"/>.
/// That method is intentionally not called; previously the same section sat behind an
/// early <c>return;</c> and was therefore unreachable.
/// </remarks>
/// <param name="args">Command-line arguments; not used.</param>
static void Main(string[] args) {
    // CldrDesignLib.RefreshCldrDataSource();
    CldrDesignLib.exportForWikibulary();

    // To run an archived task: uncomment it inside RunArchivedTasks(), then uncomment this call.
    // RunArchivedTasks();
}

/// <summary>
/// Holds the archived one-off tasks, all of which are commented out. When enabled, the
/// tasks inside the <c>using</c> block run while the <c>Impersonator</c> instance is alive.
/// </summary>
/// <remarks>
/// The account password is no longer stored in source. It is read from the
/// <c>REWISE_IMPERSONATE_PASSWORD</c> environment variable. The value that used to be
/// committed here should be treated as compromised and rotated. User and domain can be
/// overridden with <c>REWISE_IMPERSONATE_USER</c> and <c>REWISE_IMPERSONATE_DOMAIN</c>;
/// otherwise they keep their previous values.
/// </remarks>
/// <exception cref="InvalidOperationException">
/// The password environment variable is missing or empty.
/// </exception>
private static void RunArchivedTasks() {
    //signGoogleCloud();
    //var token = Google.Apis.Auth.OAuth2.GoogleCredential.GetApplicationDefault();
    //var res = Task.Run(() => (token as Google.Apis.Auth.OAuth2.ITokenAccess).GetAccessTokenForRequestAsync("texttospeech.googleapis.com")).Result;
    //var channelCredential = Grpc.Auth.GoogleGrpcCredentials.ToChannelCredentials(token);
    //var channel = new Grpc.Core.Channel("texttospeech.googleapis.com", channelCredential);
    //var cl = new tts.TextToSpeech.TextToSpeechClient(channel);
    //var resp = cl.ListVoices(new tts.ListVoicesRequest { LanguageCode = "" });
    //var json = resp.ToString();
    //json = null;

    // NOTE(review): the argument roles (user, domain, password) are inferred from the
    // literal values that used to be passed here; the positional order is unchanged.
    // Confirm against the Impersonator constructor.
    var user = Environment.GetEnvironmentVariable("REWISE_IMPERSONATE_USER") ?? "pavel";
    var domain = Environment.GetEnvironmentVariable("REWISE_IMPERSONATE_DOMAIN") ?? "LANGMaster";
    var password = GetRequiredEnvironmentVariable("REWISE_IMPERSONATE_PASSWORD");

    using (var imp = new Impersonator.Impersonator(user, domain, password)) {
        // **************************** DBNARY
        // WiktTtlParser.parseTtlsFirstRun(); // source in c:\Users\pavel\graphdb-import\dbnary\
        // WiktTtlParser.parseTtlsSecondRun(); // save to d:\rewise\data\wiktionary\dbnary\db\
        // CorpusIndex.dumpAll();

        // **************************** WORD NET
        // wordNet.Parser.xmlToDBFirstPhase();
        //wordNet.Parser.xmlToDBSecondPhase();
        // wordNet.Parser.dbStat();
        // WnWikt.createNewSource();
        //wordNet.Dumps.dumps();
        //wordNet.Dumps.lemmas();
        //wordNet.Dumps.langLemmas();
        // Console.WriteLine("done");
        // Console.ReadKey();

        //********** LANGS design
        //CldrLangRegionScript.CldrPatch();
        //MSSpellCheck.CldrPatch();

        //********** WIKI parsing
        //WikiRawConsts.createStat();
        //WikiRawParser.ExtractSections();
        //WikiRawParser.SectionStats();
        //WikiRawParser.CSWordSenses();
        //WikiRawParser.ParseToJson();

        // **************************** DBNARY
        //WiktTtlParser.parseTtlsFirstRun();
        //WiktTtlParser.parseTtlsSecondRun();
        //WiktDB.loadData();
        //Console.ReadKey();
        //WiktDumps.run();
        //WiktSchemaOld.run();
        //Corpus.CountIntervals.makeInts();
        //var cldr = LangsDesignDirs.cldrRepo;
        //CldrLangRegionScript2.CldrPatch();
        //Wiki.CldrPatch();
        //WiktQueries.runQueriess();
        // WiktQueries.imports();
        // WiktQueries.metaInfos();
        //WiktIdManager.allocArrays();
        //WiktSchema.dumps();
        //WiktQueries.runQueries("bg");
        //WiktReplaceUrlByIds.runs();
        //WiktReplaceUrlByIds.run("bg");
        //WiktToSQL.run("bg");
        //WiktToSQL.run("bg");
        //MSCultures.CldrPatch();
        //MSSpellCheck.CldrPatch();
        //MSStemmBreak.CldrPatch();
        //GoogleTrans.CldrPatch();
        //WikiLangs.Build();
        //var words = Corpus.Parser.parseXml(@"c:\rewise\data\wikies\bdwikimediaa", "bn-BD").ToArray();
        //words = null;
        //Corpus.Lists.frekvent("vi-VN");
        //Corpus.DownloadWikies.download();
        //Corpus.DownloadWikies.parseHome();
        //Corpus.DbpediaParser.parseTTL();
        // var count = dbCtx.Synsets.Where(s => s.Senses.Count > 1).Count();
        // count = 0;
        //var res = arab.SelectMany(entry => entry.Senses.SelectMany(sense => sense.Synset.TranslationSources)).ToArray(); //.Select(t => new {src = entry.Lemma, tran=sense.Entry.Lemma }))).ToArray();
        //// var res = arab.Where(t => t.To.Senses.Count() == 0).Count();
        //var resFrom = arab.SelectMany(t => t.From.Senses.Select(s => s.Entry.Lemma)).Count();
        //var fromEmpty = arab.Where(t => t.From.Senses.Count==0).Count();
        //var resTo = arab.SelectMany(t => t.To.Senses.Select(s => s.Entry.Lemma)).Count();
        //resFrom = 0;
        //var ctx = wordNet.Import.getContext(true);
        //using (var rdr = new StreamReader(@"c:\temp\split\en_dbnary_ontolex_20190420.001")) {
        //  foreach (var l in rdr.ReadAllLines()) {
        //    if (l == null) throw new Exception();
        //  }
        //}
        //IGraph g = new LMGraph();
        //FileLoader.Load(g, @"c:\temp\en_dbnary_ontolex_20190420.ttl");
        //SpellCheck.withoutSpellChecker();
        //return;
        //var w = new Word.Application();
        //w.Visible = true;
        //var doc = w.Documents.Add();
        //var par = doc.Paragraphs.Add(); // .Range(start, end).InsertParagraph();
        //par.Range.Text = "Ahoj, jak se mášš?";
        //doc.Content.LanguageID = Word.WdLanguageID.wdCzech;
        //doc.SpellingChecked = false;
        //List<string> mispelled = new List<string>();
        //foreach (Word.Range word in doc.Words)
        //  foreach (Word.Range err in word.SpellingErrors) {
        //    mispelled.Add(err.Text);
        //  }
        //Console.ReadKey();
        //object dontSave = Word.WdSaveOptions.wdDoNotSaveChanges;
        //doc.Close(ref dontSave);
        //w.Quit();
        //var l = new List<int>();
        //foreach (var fn in Directory.EnumerateFiles(@"d:\rewise\data\01_csv\", "*.csv", SearchOption.AllDirectories)) {
        //  var txt = File.ReadAllText(fn); ; //.Replace('\uFEFF', ' ');
        //  var idx = txt.IndexOf('\uFEFF');
        //  if (idx < 0) continue;
        //  File.WriteAllText(fn, txt.Replace('\uFEFF', ' '), Encoding.UTF8);
        //}
        //l = null;
        //var oldLangs = "".Split(',');
        //var newLangs = oldLangs.Select(old => Langs.oldToNew(old)).JoinStrings(",");
        //newLangs = null;
        //var txt = "по́щенска ма́рка";
        //var len1 = txt.Normalize(NormalizationForm.FormC).Length;
        //var len2 = txt.Normalize(NormalizationForm.FormD).Length;
        //var len3 = txt.Normalize(NormalizationForm.FormKC).Length;
        //var len4 = txt.Normalize(NormalizationForm.FormKD).Length;
        //txt = null;
        //var lang = "de-DE";
        //foreach (var txt in new string[] { "heißen" }) {
        //  var res = StemmerBreakerNew.Service.wordBreak(lang, new List<String>() { txt });
        //  var words = res[0].Select(p => txt.Substring(p.Pos, p.Len)).ToArray();
        //  foreach (var w in words) {
        //    var res2 = StemmerBreakerNew.Service.getWordStemms(lang, w).JoinStrings(">");
        //    res2 = null;
        //  }
        //}
        //lang = null;

        //************** IMPORT FROM RJ
        //ImportFromRJ.Import();

        //****** basic utils
        //CreateFrekventWords.run();
        //HunspellLib.extractWordLists();
        //StemmingRaw.processLangs(WordLists.wordLists);

        //************** LANGS START
        //LangsDesignLib.Build(); //ALL
        //UnicodeDesignLib.getUnicodeBlockNames();
        //CldrDesignLib.RefreshCldrDataSource();
        //CldrDesignLib.RefreshNetSuportedCultures();
        //CldrDesignLib.RefreshOldToNew();
        //CldrDesignLib.RefreshTexts();
        //CldrDesignLib.Build();
        //CldrTrans.Build();
        //CldrDesignLib.RefreshCldrStatistics();
        //LangsDesignLib.RefreshOldVersionInfo();
        //LangsDesignLib.MergeOldToCldr();
        //CldrDesignLib.BuildDart();
        //CldrDesignLib.UnicodeDart();
        //************** LANGS END

        //****** basic tests
        //var resp = Client.makeRequest(client => client.SayHello(new RewiseDom.HelloRequest { CsharpId = 1234, NoRecursion = true }));
        //Diff.Test();
        //CldrLangMatrix.load().save();
        //var lang = "en-GB";
        //foreach (var txt in new string[] { "flowers'", "flowers’" }) {
        //  var res = StemmerBreakerNew.Service.wordBreak(lang, new List<String>() { txt });
        //  var words = res[0].Select(p => txt.Substring(p.Pos, p.Len)).ToArray();
        //  foreach (var w in words) {
        //    var res2 = StemmerBreakerNew.Service.getWordStemms(lang, w).JoinStrings(">");
        //    res2 = null;
        //  }
        //}
        //lang = null;
        //Unicode.dumpNetUncLettersDiff();
        //var idxs = LangsLib.UnicodeBlockNames.blockIdxs("abcABC123-");
        //StemmingRaw.processLang(LangsLib.Metas.get(LangsLib.langs.de_de).lc, WordLists.wordLists, true, false);
        //var metas = new LangsLib.Metas();
        //StemmerBreaker.Services.testCreation();

        //****** trash
        //var reps = Sepia.Globalization.Cldr.Instance.Repositories; //C:\Users\pavel\AppData\Local\UnicodeCLDR\core
        //reps = null;
        //CultureInfoTexts.dumpCldrRbnfTypes();
        //lang_chars.extractFromMimer.extractAlphabets();
        //lang_chars.extractFromMimer.useAlphabets();
        //var config = new RewiseDom.Config();
        //config.WorkSpaces["localhost"] = new RewiseDom.WorkSpace { CsharpServer = new RewiseDom.Connection { Host = "localhost", Port = 1234 } };
        //var ser = Protobuf.ToJson(config);
        //ser = null;
        //Huffman_Encoding.Program.Main();
        //BitsProgram.Main();
        //var buf = MatrixToDartTask.import(@"c:\rewise\design\importFromRJ\appdata\source\all\GoetheVerlag.csv", null, null);
    }
}

/// <summary>
/// Returns the value of the environment variable <paramref name="name"/>.
/// </summary>
/// <param name="name">Name of the environment variable to read.</param>
/// <returns>The non-empty value of the variable.</returns>
/// <exception cref="InvalidOperationException">
/// The variable is not set or is empty.
/// </exception>
private static string GetRequiredEnvironmentVariable(string name) {
    var value = Environment.GetEnvironmentVariable(name);
    if (string.IsNullOrEmpty(value)) {
        // Fail with a clear message instead of passing null on to the caller.
        throw new InvalidOperationException("Environment variable '" + name + "' must be set.");
    }
    return value;
}