awesome-japanese-nlp-resources.json

{
    "version": "2.1.0",
    "contents": {
        "Python library": {
            "https://github.com/WorksApplications/sudachi.rs": {
                "sub_category": "Morphology analysis",
                "repository_name": "sudachi.rs",
                "user_name": "WorksApplications",
                "description": "SudachiPy 0.6* and above are developed as Sudachi.rs.",
                "multilingual_descriptions": {
                    "en": "SudachiPy 0.6* and above are developed as Sudachi.rs.",
                    "ja": "SudachiPy 0.6以上はSudachi.rsとして開発されています。",
                    "zh-hans": "SudachiPy 0.6及以上版本已经开发为Sudachi.rs。",
                    "zh-hant": "SudachiPy 0.6*及以上版本已開發為Sudachi.rs。"
                }
            },
            "https://github.com/mocobeta/janome": {
                "sub_category": "Morphology analysis",
                "repository_name": "janome",
                "user_name": "mocobeta",
                "description": "Japanese morphological analysis engine written in pure Python",
                "multilingual_descriptions": {
                    "en": "Japanese morphological analysis engine written in pure Python",
                    "ja": "純粋なPythonで書かれた日本語形態素解析エンジン",
                    "zh-hans": "用纯Python编写的日语形态分析引擎",
                    "zh-hant": "純Python編寫的日語形態分析引擎"
                }
            },
            "https://github.com/SamuraiT/mecab-python3": {
                "sub_category": "Morphology analysis",
                "repository_name": "mecab-python3",
                "user_name": "SamuraiT",
                "description": "mecab-python. mecab-python. you can find original version here:http://taku910.github.io/mecab/",
                "multilingual_descriptions": {
                    "en": "mecab-python. mecab-python. you can find original version here:http://taku910.github.io/mecab/",
                    "ja": "mecab-pythonです。mecab-pythonです。オリジナルバージョンはこちらから見つけることができます：http://taku910.github.io/mecab/。",
                    "zh-hans": "mecab-python。mecab-python。您可以在此处找到原始版本：http://taku910.github.io/mecab/。",
                    "zh-hant": "mecab-python。mecab-python。您可以在此處找到原始版本：http://taku910.github.io/mecab/。"
                }
            },
            "https://github.com/ikegami-yukino/mecab": {
                "sub_category": "Morphology analysis",
                "repository_name": "mecab",
                "user_name": "ikegami-yukino",
                "description": "This repository is for building Windows 64-bit MeCab binary and improving MeCab Python binding.",
                "multilingual_descriptions": {
                    "en": "This repository is for building Windows 64-bit MeCab binary and improving MeCab Python binding.",
                    "ja": "このリポジトリは、Windows 64ビット用のMeCabバイナリのビルドと、MeCab Pythonバインディングの改善に使用されます。",
                    "zh-hans": "这个仓库用于构建Windows 64位MeCab二进制文件并改进MeCab Python绑定。",
                    "zh-hant": "這個存儲庫是用於構建Windows 64位MeCab二進制文件和改進MeCab Python綁定的。"
                }
            },
            "https://github.com/polm/fugashi": {
                "sub_category": "Morphology analysis",
                "repository_name": "fugashi",
                "user_name": "polm",
                "description": "A Cython MeCab wrapper for fast, pythonic Japanese tokenization and morphological analysis.",
                "multilingual_descriptions": {
                    "en": "A Cython MeCab wrapper for fast, pythonic Japanese tokenization and morphological analysis.",
                    "ja": "高速でPythonicな日本語トークナイズと形態素解析のためのCython MeCabラッパー。",
                    "zh-hans": "一个Cython MeCab包装器，用于快速、Pythonic的日语分词和形态分析。",
                    "zh-hant": "一個Cython MeCab包裝器，用於快速、Python式的日語分詞和形態分析。"
                }
            },
            "https://github.com/taishi-i/nagisa": {
                "sub_category": "Morphology analysis",
                "repository_name": "nagisa",
                "user_name": "taishi-i",
                "description": "A Japanese tokenizer based on recurrent neural networks",
                "multilingual_descriptions": {
                    "en": "A Japanese tokenizer based on recurrent neural networks",
                    "ja": "再帰型ニューラルネットワークに基づく日本語トークナイザー",
                    "zh-hans": "基于循环神经网络的日语分词器",
                    "zh-hant": "基於循環神經網絡的日語分詞器"
                }
            },
            "https://github.com/ku-nlp/pyknp": {
                "sub_category": "Morphology analysis",
                "repository_name": "pyknp",
                "user_name": "ku-nlp",
                "description": "A Python Module for JUMAN++/KNP",
                "multilingual_descriptions": {
                    "en": "A Python Module for JUMAN++/KNP",
                    "ja": "JUMAN++/KNP用のPythonモジュール",
                    "zh-hans": "一个用于JUMAN++/KNP的Python模块",
                    "zh-hant": "一個用於 JUMAN++/KNP 的 Python 模組"
                }
            },
            "https://github.com/chezou/Mykytea-python": {
                "sub_category": "Morphology analysis",
                "repository_name": "Mykytea-python",
                "user_name": "chezou",
                "description": "Python wrapper for KyTea",
                "multilingual_descriptions": {
                    "en": "Python wrapper for KyTea",
                    "ja": "KyTeaのPythonラッパー",
                    "zh-hans": "KyTea的Python封装程序",
                    "zh-hant": "KyTea 的 Python 封裝程式"
                }
            },
            "https://github.com/himkt/konoha": {
                "sub_category": "Morphology analysis",
                "repository_name": "konoha",
                "user_name": "himkt",
                "description": "Konoha: Simple wrapper of Japanese Tokenizers",
                "multilingual_descriptions": {
                    "en": "Konoha: Simple wrapper of Japanese Tokenizers",
                    "ja": "Konoha：日本語トークナイザーのシンプルなラッパー",
                    "zh-hans": "Konoha：日语分词器的简单封装",
                    "zh-hant": "木葉：日本分詞器的簡單封裝"
                }
            },
            "https://github.com/buruzaemon/natto-py": {
                "sub_category": "Morphology analysis",
                "repository_name": "natto-py",
                "user_name": "buruzaemon",
                "description": "natto-py combines the Python programming language with MeCab, the part-of-speech and morphological analyzer for the Japanese language.",
                "multilingual_descriptions": {
                    "en": "natto-py combines the Python programming language with MeCab, the part-of-speech and morphological analyzer for the Japanese language.",
                    "ja": "natto-pyは、Pythonプログラミング言語と日本語の品詞や形態素解析器であるMeCabを組み合わせたものです。",
                    "zh-hans": "natto-py将Python编程语言与MeCab（日语的词性和形态分析器）结合起来。",
                    "zh-hant": "natto-py 將 Python 程式語言與 MeCab 結合，後者是日語詞性和形態分析器。"
                }
            },
            "https://github.com/ikegami-yukino/rakutenma-python": {
                "sub_category": "Morphology analysis",
                "repository_name": "rakutenma-python",
                "user_name": "ikegami-yukino",
                "description": "Rakuten MA (Python version)",
                "multilingual_descriptions": {
                    "en": "Rakuten MA (Python version)",
                    "ja": "楽天MA（Python版）",
                    "zh-hans": "乐天 MA（Python 版本）",
                    "zh-hant": "樂天 MA（Python 版本）"
                }
            },
            "https://github.com/daac-tools/python-vaporetto": {
                "sub_category": "Morphology analysis",
                "repository_name": "python-vaporetto",
                "user_name": "daac-tools",
                "description": "Vaporetto is a fast and lightweight pointwise prediction based tokenizer. This is a Python wrapper for Vaporetto.",
                "multilingual_descriptions": {
                    "en": " Vaporetto is a fast and lightweight pointwise prediction based tokenizer. This is a Python wrapper for Vaporetto.",
                    "ja": "Vaporettoは、高速で軽量なポイントワイズ予測ベースのトークナイザーです。これはVaporettoのPythonラッパーです。",
                    "zh-hans": "Vaporetto是一种快速且轻量级的基于点预测的分词器。这是Vaporetto的Python封装。",
                    "zh-hant": "Vaporetto 是一個快速且輕量級的基於點預測的分詞器。這是 Vaporetto 的 Python 封裝。"
                }
            },
            "https://github.com/mkartawijaya/dango": {
                "sub_category": "Morphology analysis",
                "repository_name": "dango",
                "user_name": "mkartawijaya",
                "description": "An easy to use tokenizer for Japanese text, aimed at language learners and non-linguists",
                "multilingual_descriptions": {
                    "en": "An easy to use tokenizer for Japanese text, aimed at language learners and non-linguists",
                    "ja": "日本語テキスト用の使いやすいトークナイザー。言語学習者や非言語学者を対象としています。",
                    "zh-hans": "一个易于使用的日语文本分词器，旨在为语言学习者和非语言学家提供帮助。",
                    "zh-hant": "一個易於使用的日文分詞器，針對語言學習者和非語言學家。"
                }
            },
            "https://github.com/ku-nlp/rhoknp": {
                "sub_category": "Morphology analysis",
                "repository_name": "rhoknp",
                "user_name": "ku-nlp",
                "description": "Yet another Python binding for Juman++/KNP",
                "multilingual_descriptions": {
                    "en": "Yet another Python binding for Juman++/KNP",
                    "ja": "Juman++/KNPのための別のPythonバインディング",
                    "zh-hans": "又一个Python绑定Juman++/KNP",
                    "zh-hant": "又一個 Juman++/KNP 的 Python 綁定程式"
                }
            },
            "https://github.com/daac-tools/python-vibrato": {
                "sub_category": "Morphology analysis",
                "repository_name": "python-vibrato",
                "user_name": "daac-tools",
                "description": "Viterbi-based accelerated tokenizer (Python wrapper)",
                "multilingual_descriptions": {
                    "en": " Viterbi-based accelerated tokenizer (Python wrapper)",
                    "ja": "Viterbiベースの高速トークナイザー（Pythonラッパー）",
                    "zh-hans": "基于维特比算法的加速分词器（Python封装）",
                    "zh-hant": "基於維特比算法的加速分詞器（Python封裝）"
                }
            },
            "https://github.com/lighttransport/jagger-python": {
                "sub_category": "Morphology analysis",
                "repository_name": "jagger-python",
                "user_name": "lighttransport",
                "description": "Python binding for Jagger(C++ implementation of Pattern-based Japanese Morphological Analyzer)",
                "multilingual_descriptions": {
                    "en": "Python binding for Jagger(C++ implementation of Pattern-based Japanese Morphological Analyzer)",
                    "ja": "JaggerのPythonバインディング（パターンベースの日本語形態素解析器のC++実装）",
                    "zh-hans": "Python绑定Jagger（基于模式的日语形态分析器的C++实现）",
                    "zh-hant": "Jagger的Python綁定（基於模式的日語形態分析器的C++實現）"
                }
            },
            "https://github.com/megagonlabs/ginza": {
                "sub_category": "Parsing",
                "repository_name": "ginza",
                "user_name": "megagonlabs",
                "description": "A Japanese NLP Library using spaCy as framework based on Universal Dependencies",
                "multilingual_descriptions": {
                    "en": "A Japanese NLP Library using spaCy as framework based on Universal Dependencies",
                    "ja": "ユニバーサル依存関係に基づくspaCyフレームワークを使用した日本語NLPライブラリ",
                    "zh-hans": "一个基于通用依存关系的spaCy框架的日语NLP库。",
                    "zh-hant": "一個基於Universal Dependencies的spaCy框架的日本NLP庫"
                }
            },
            "https://github.com/ikegami-yukino/cabocha": {
                "sub_category": "Parsing",
                "repository_name": "cabocha",
                "user_name": "ikegami-yukino",
                "description": "Yet Another Japanese Dependency Structure Analyzer",
                "multilingual_descriptions": {
                    "en": "Yet Another Japanese Dependency Structure Analyzer",
                    "ja": "もう一つの日本語依存構造解析ツール",
                    "zh-hans": "另一个日语依存结构分析器",
                    "zh-hant": "另一個日本依存結構分析器"
                }
            },
            "https://github.com/KoichiYasuoka/UniDic2UD": {
                "sub_category": "Parsing",
                "repository_name": "UniDic2UD",
                "user_name": "KoichiYasuoka",
                "description": "Tokenizer POS-tagger Lemmatizer and Dependency-parser for modern and contemporary Japanese",
                "multilingual_descriptions": {
                    "en": "Tokenizer POS-tagger Lemmatizer and Dependency-parser for modern and contemporary Japanese",
                    "ja": "現代日本語のためのトークナイザー、POSタガー、レンマ化器、依存構造解析器",
                    "zh-hans": "现代和当代日语的分词器、词性标注器、词形还原器和依存句法分析器",
                    "zh-hant": "現代和當代日語的分詞器、詞性標記器、詞形還原器和依存句法分析器"
                }
            },
            "https://github.com/PKSHATechnology-Research/camphr": {
                "sub_category": "Parsing",
                "repository_name": "camphr",
                "user_name": "PKSHATechnology-Research",
                "description": "NLP libary for creating pipeline components",
                "multilingual_descriptions": {
                    "en": "Camphr - NLP libary for creating pipeline components",
                    "ja": "Camphr - パイプラインコンポーネントを作成するためのNLPライブラリ",
                    "zh-hans": "Camphr - 用于创建管道组件的NLP库",
                    "zh-hant": "Camphr - 用於創建管道組件的 NLP 庫"
                }
            },
            "https://github.com/KoichiYasuoka/SuPar-UniDic": {
                "sub_category": "Parsing",
                "repository_name": "SuPar-UniDic",
                "user_name": "KoichiYasuoka",
                "description": "Tokenizer POS-tagger Lemmatizer and Dependency-parser for modern and contemporary Japanese with BERT models",
                "multilingual_descriptions": {
                    "en": "Tokenizer POS-tagger Lemmatizer and Dependency-parser for modern and contemporary Japanese with BERT models",
                    "ja": "モダン・コンテンポラリー日本語用のTokenizer、POS-tagger、Lemmatizer、およびDependency-parserには、BERTモデルが使用されます。",
                    "zh-hans": "使用BERT模型的现代和当代日语分词器、词性标注器、词形还原器和依存句法分析器。",
                    "zh-hant": "使用BERT模型的現代和當代日語分詞器、詞性標記器、詞形還原器和依存句法分析器"
                }
            },
            "https://github.com/masashi-y/depccg": {
                "sub_category": "Parsing",
                "repository_name": "depccg",
                "user_name": "masashi-y",
                "description": "A* CCG Parser with a Supertag and Dependency Factored Model",
                "multilingual_descriptions": {
                    "en": "A* CCG Parser with a Supertag and Dependency Factored Model",
                    "ja": "スーパータグと依存関係ファクタリングモデルを備えたA* CCGパーサー",
                    "zh-hans": "带有超级标签和依存因素模型的A* CCG解析器",
                    "zh-hant": "具有超標記和依存因素模型的A* CCG解析器"
                }
            },
            "https://github.com/ku-nlp/bertknp": {
                "sub_category": "Parsing",
                "repository_name": "bertknp",
                "user_name": "ku-nlp",
                "description": "A Japanese dependency parser based on BERT",
                "multilingual_descriptions": {
                    "en": "A Japanese dependency parser based on BERT",
                    "ja": "BERTに基づく日本語依存構造解析器",
                    "zh-hans": "基于BERT的日语依存句法分析器",
                    "zh-hant": "基於BERT的日語依存句法分析器"
                }
            },
            "https://github.com/KoichiYasuoka/esupar": {
                "sub_category": "Parsing",
                "repository_name": "esupar",
                "user_name": "KoichiYasuoka",
                "description": "Tokenizer POS-Tagger and Dependency-parser with BERT/RoBERTa/DeBERTa models for Japanese and other languages",
                "multilingual_descriptions": {
                    "en": "Tokenizer POS-Tagger and Dependency-parser with BERT/RoBERTa/DeBERTa models for Japanese and other languages",
                    "ja": "日本語や他の言語に対応したBERT/RoBERTa/DeBERTaモデルを使用したトークナイザー、POSタガー、依存構造解析器。",
                    "zh-hans": "使用BERT/RoBERTa/DeBERTa模型的分词器POS-标注器和依存句法分析器，适用于日语和其他语言。",
                    "zh-hant": "使用BERT/RoBERTa/DeBERTa模型的分詞器POS-標記器和依存句法分析器，適用於日語和其他語言。"
                }
            },
            "https://github.com/passaglia/yomikata": {
                "sub_category": "Parsing",
                "repository_name": "yomikata",
                "user_name": "passaglia",
                "description": "Heteronym disambiguation library using a fine-tuned BERT model.",
                "multilingual_descriptions": {
                    "en": "Heteronym disambiguation library using a fine-tuned BERT model.",
                    "ja": "微調整されたBERTモデルを使用した異音異義語の曖昧性解消ライブラリ。",
                    "zh-hans": "使用经过微调的BERT模型的异音词消歧库。",
                    "zh-hant": "使用微調的BERT模型進行異音詞消歧的程式庫。"
                }
            },
            "https://github.com/lighttransport/jdepp-python": {
                "sub_category": "Parsing",
                "repository_name": "jdepp-python",
                "user_name": "lighttransport",
                "description": "Python binding for J.DepP(C++ implementation of Japanese Dependency Parsers)",
                "multilingual_descriptions": {
                    "en": "Python binding for J.DepP(C++ implementation of Japanese Dependency Parsers)",
                    "ja": "J.DepPのPythonバインディング（日本語依存構造解析器のC++実装）",
                    "zh-hans": "Python绑定J.DepP（日语依存解析器的C++实现）",
                    "zh-hant": "J.DepP的Python綁定（日本依存句法分析器的C++實現）"
                }
            },
            "https://github.com/daisukebekki/lightblue": {
                "sub_category": "Parsing",
                "repository_name": "lightblue",
                "user_name": "daisukebekki",
                "description": "A CCG parser for Japanese with DTS-representations",
                "multilingual_descriptions": {
                    "en": "A CCG parser for Japanese with DTS-representations",
                    "ja": "DTS表現を使用した日本語のCCGパーサー",
                    "zh-hans": "一个用于日语的带有DTS表示的CCG解析器",
                    "zh-hant": "一個具有DTS表示的日語CCG解析器"
                }
            },
            "https://github.com/borh-lab/natsume-simple": {
                "sub_category": "Parsing",
                "repository_name": "natsume-simple",
                "user_name": "borh-lab",
                "description": "natsume-simpleは日本語の係り受け関係検索システム",
                "multilingual_descriptions": {
                    "en": "natsume-simple is a Japanese dependency relation search system.",
                    "ja": "natsume-simpleは日本語の係り受け関係検索システム",
                    "zh-hans": "natsume-simple是一个日语依存关系搜索系统",
                    "zh-hant": "natsume-simple是一個日語的依存關係搜索系統。"
                }
            },
            "https://github.com/miurahr/pykakasi": {
                "sub_category": "Converter",
                "repository_name": "pykakasi",
                "user_name": "miurahr",
                "description": "Lightweight converter from Japanese Kana-kanji sentences into Kana-Roman.",
                "multilingual_descriptions": {
                    "en": "Lightweight converter from Japanese Kana-kanji sentences into Kana-Roman.",
                    "ja": "日本語の仮名漢字文から仮名ローマ字文に変換する軽量コンバーター。",
                    "zh-hans": "将日语假名汉字句子转换为假名罗马字的轻量级转换器。",
                    "zh-hant": "輕量級的轉換器，可將日文假名漢字句子轉換為假名羅馬字。"
                }
            },
            "https://github.com/polm/cutlet": {
                "sub_category": "Converter",
                "repository_name": "cutlet",
                "user_name": "polm",
                "description": "Japanese to romaji converter in Python",
                "multilingual_descriptions": {
                    "en": "Japanese to romaji converter in Python",
                    "ja": "Pythonでの日本語からローマ字への変換ツール",
                    "zh-hans": "Python中的日语转罗马字转换器",
                    "zh-hant": "Python中的日文轉羅馬字轉換器"
                }
            },
            "https://github.com/shihono/alphabet2kana": {
                "sub_category": "Converter",
                "repository_name": "alphabet2kana",
                "user_name": "shihono",
                "description": "Convert English alphabet to Katakana",
                "multilingual_descriptions": {
                    "en": "Convert English alphabet to Katakana",
                    "ja": "英語アルファベットをカタカナに変換してください。",
                    "zh-hans": "将英文字母转换为片假名",
                    "zh-hant": "將英文字母轉換為片假名"
                }
            },
            "https://github.com/Greatdane/Convert-Numbers-to-Japanese": {
                "sub_category": "Converter",
                "repository_name": "Convert-Numbers-to-Japanese",
                "user_name": "Greatdane",
                "description": "Converts Arabic numerals, or 'western' style numbers, to a Japanese context.",
                "multilingual_descriptions": {
                    "en": "Converts Arabic numerals, or 'western' style numbers, to a Japanese context.",
                    "ja": "アラビア数字、または「西洋式」の数字を日本の文脈に変換します。",
                    "zh-hans": "将阿拉伯数字或“西方”风格的数字转换为日本语境。",
                    "zh-hant": "將阿拉伯數字或「西方」風格的數字轉換為日本上下文。"
                }
            },
            "https://github.com/ikegami-yukino/mozcpy": {
                "sub_category": "Converter",
                "repository_name": "mozcpy",
                "user_name": "ikegami-yukino",
                "description": "Mozc for Python: Kana-Kanji converter",
                "multilingual_descriptions": {
                    "en": "Mozc for Python: Kana-Kanji converter",
                    "ja": "Python用Mozc：かな漢字変換器",
                    "zh-hans": "Python的Mozc：假名汉字转换器",
                    "zh-hant": "Python的Mozc：假名漢字轉換器"
                }
            },
            "https://github.com/tachi-hi/jamorasep": {
                "sub_category": "Converter",
                "repository_name": "jamorasep",
                "user_name": "tachi-hi",
                "description": "Japanese text parser to separate Hiragana/Katakana string into morae (syllables).",
                "multilingual_descriptions": {
                    "en": "Japanese text parser that separates Hiragana/Katakana strings into morae (syllables).",
                    "ja": "ひらがな/カタカナの文字列をモーラ（音節）に分割する日本語テキストパーサー。",
                    "zh-hans": "日语文本解析器，将平假名/片假名字符串分离成音节（拼音）。",
                    "zh-hant": "日文文本解析器，將平假名/片假名字符串分離成音節（拼音）。"
                }
            },
            "https://github.com/korguchi/text2phoneme": {
                "sub_category": "Converter",
                "repository_name": "text2phoneme",
                "user_name": "korguchi",
                "description": "日本語文を音素列へ変換するスクリプト",
                "multilingual_descriptions": {
                    "en": "Script to convert Japanese text into phoneme sequence.",
                    "ja": "日本語文を音素列へ変換するスクリプト",
                    "zh-hans": "将日语文本转换为音素序列的脚本",
                    "zh-hant": "將日文轉換為音素序列的腳本"
                }
            },
            "https://github.com/opencollector/jntajis-python": {
                "sub_category": "Converter",
                "repository_name": "jntajis-python",
                "user_name": "opencollector",
                "description": "A fast character conversion and transliteration library based on the scheme defined for Japan National Tax Agency (国税庁) 's",
                "multilingual_descriptions": {
                    "en": "A fast character conversion and transliteration library based on the scheme defined for Japan National Tax Agency (国税庁) 's corporate number (法人番号) system.",
                    "ja": "日本国税庁の法人番号システムで定義されたスキームに基づく、高速な文字変換および転写ライブラリ。",
                    "zh-hans": "一个快速的字符转换和音译库，基于日本国税局的法人番号系统定义的方案。",
                    "zh-hant": "一個快速的字符轉換和音譯庫，基於日本國稅廳的法人番號系統定義的方案。"
                }
            },
            "https://github.com/eggplants/wiredify": {
                "sub_category": "Converter",
                "repository_name": "wiredify",
                "user_name": "eggplants",
                "description": "Convert japanese kana from ba-bi-bu-be-bo into va-vi-vu-ve-vo",
                "multilingual_descriptions": {
                    "en": "Convert japanese kana from ba-bi-bu-be-bo into va-vi-vu-ve-vo",
                    "ja": "「ばびぶべぼ」から「ヴァヴィヴヴェヴォ」に変換してください。",
                    "zh-hans": "将日语假名从ba-bi-bu-be-bo转换为va-vi-vu-ve-vo",
                    "zh-hant": "將日文假名從ba-bi-bu-be-bo轉換為va-vi-vu-ve-vo\n將日文假名從ba-bi-bu-be-bo轉換為va-vi-vu-ve-vo"
                }
            },
            "https://github.com/34j/mecab-text-cleaner": {
                "sub_category": "Converter",
                "repository_name": "mecab-text-cleaner",
                "user_name": "34j",
                "description": "Simple Python package (CLI/Python API) for getting japanese readings (yomigana) and accents using MeCab.",
                "multilingual_descriptions": {
                    "en": "Simple Python package (CLI/Python API) for getting japanese readings (yomigana) and accents using MeCab.",
                    "ja": "MeCabを使用して、日本語の読み仮名とアクセントを取得するためのシンプルなPythonパッケージ（CLI/Python API）。",
                    "zh-hans": "使用MeCab获取日语读音（yomigana）和重音的简单Python包（CLI/Python API）。",
                    "zh-hant": "使用MeCab獲取日文讀音（yomigana）和重音的簡單Python套件（CLI/Python API）。"
                }
            },
            "https://github.com/tkscode/pynormalizenumexp": {
                "sub_category": "Converter",
                "repository_name": "pynormalizenumexp",
                "user_name": "tkscode",
                "description": "数量表現や時間表現の抽出・正規化を行うNormalizeNumexpのPython実装",
                "multilingual_descriptions": {
                    "en": "Python implementation of NormalizeNumexp for extracting and normalizing quantity expressions and time expressions.",
                    "ja": "数量表現や時間表現の抽出・正規化を行うNormalizeNumexpのPython実装\n\n数量表現や時間表現の抽出・正規化を行うNormalizeNumexpのPython実装",
                    "zh-hans": "使用Python实现NormalizeNumexp，用于提取和规范化数量和时间表达式。",
                    "zh-hant": "執行NormalizeNumexp的Python實作，進行數量表達和時間表達的提取和規範化。"
                }
            },
            "https://github.com/nagataaaas/Jusho": {
                "sub_category": "Converter",
                "repository_name": "Jusho",
                "user_name": "nagataaaas",
                "description": "Easy wrapper for the postal code data of Japan",
                "multilingual_descriptions": {
                    "en": "Easy wrapper for the postal code data of Japan",
                    "ja": "日本の郵便番号データの簡単なラッパー",
                    "zh-hans": "日本邮政编码数据的简易封装器",
                    "zh-hant": "日本郵政編碼數據的簡單封裝"
                }
            },
            "https://github.com/sea-turt1e/yurenizer": {
                "sub_category": "Converter",
                "repository_name": "yurenizer",
                "user_name": "sea-turt1e",
                "description": "Japanese text normalizer that resolves spelling inconsistencies. （日本語表記揺れ解消ツール）",
                "multilingual_descriptions": {
                    "en": "Japanese text normalizer that resolves spelling inconsistencies. （日本語表記揺れ解消ツール",
                    "ja": "日本語テキストの表記の一貫性を解消する日本語テキスト正規化ツール",
                    "zh-hans": "日语文本规范化工具，解决拼写不一致问题。",
                    "zh-hant": "日文文本正規化工具，解決拼寫不一致。"
                }
            },
            "https://github.com/ikegami-yukino/neologdn": {
                "sub_category": "Preprocessor",
                "repository_name": "neologdn",
                "user_name": "ikegami-yukino",
                "description": "Japanese text normalizer for mecab-neologd",
                "multilingual_descriptions": {
                    "en": "Japanese text normalizer for mecab-neologd",
                    "ja": "mecab-neologd用の日本語テキスト正規化ツール",
                    "zh-hans": "针对mecab-neologd的日语文本规范化工具",
                    "zh-hant": "mecab-neologd 的日文文本正規化工具"
                }
            },
            "https://github.com/ikegami-yukino/jaconv": {
                "sub_category": "Preprocessor",
                "repository_name": "jaconv",
                "user_name": "ikegami-yukino",
                "description": "Pure-Python Japanese character interconverter for Hiragana, Katakana, Hankaku, and Zenkaku",
                "multilingual_descriptions": {
                    "en": "A Python-based tool for converting Japanese characters between Hiragana, Katakana, Hankaku, and Zenkaku.",
                    "ja": "ひらがな、カタカナ、半角、全角のための純粋なPython日本語文字相互変換器",
                    "zh-hans": "纯Python日语字符互转器，支持平假名、片假名、半角和全角。",
                    "zh-hant": "純Python日文字符互轉器，支援平假名、片假名、半角和全角。"
                }
            },
            "https://github.com/studio-ousia/mojimoji": {
                "sub_category": "Preprocessor",
                "repository_name": "mojimoji",
                "user_name": "studio-ousia",
                "description": "A fast converter between Japanese hankaku and zenkaku characters",
                "multilingual_descriptions": {
                    "en": "A quick converter for Japanese half-width and full-width characters.",
                    "ja": "日本語半角と全角の素早い変換ツール",
                    "zh-hans": "一个快速转换日语半角和全角字符的转换器",
                    "zh-hant": "一個快速轉換日文半角和全角字符的轉換器"
                }
            },
            "https://github.com/ku-nlp/text-cleaning": {
                "sub_category": "Preprocessor",
                "repository_name": "text-cleaning",
                "user_name": "ku-nlp",
                "description": "A powerful text cleaner for Japanese web texts",
                "multilingual_descriptions": {
                    "en": "A powerful text cleaner for Japanese web texts",
                    "ja": "日本語のウェブテキスト用の強力なテキストクリーナー",
                    "zh-hans": "一款强大的日语网页文本清理工具",
                    "zh-hant": "一款強大的日文網頁文本清理工具"
                }
            },
            "https://github.com/HojiChar/HojiChar": {
                "sub_category": "Preprocessor",
                "repository_name": "HojiChar",
                "user_name": "HojiChar",
                "description": "複数の前処理を構成して管理するテキスト前処理ツール",
                "multilingual_descriptions": {
                    "en": "A text preprocessing tool that configures and manages multiple preprocessing steps.",
                    "ja": "複数の前処理を構成して管理するテキスト前処理ツール",
                    "zh-hans": "管理多个前处理的文本前处理工具",
                    "zh-hant": "構成並管理多個前處理的文字前處理工具"
                }
            },
            "https://github.com/juno-rmks/utsuho": {
                "sub_category": "Preprocessor",
                "repository_name": "utsuho",
                "user_name": "juno-rmks",
                "description": "Utsuho is a Python module that facilitates bidirectional conversion between half-width katakana and full-width katakana in Japanese.",
                "multilingual_descriptions": {
                    "en": "Utsuho is a Python module that facilitates bidirectional conversion between half-width katakana and full-width katakana in Japanese.",
                    "ja": "Utsuhoは、日本語の半角カタカナと全角カタカナの間で双方向変換を容易にするPythonモジュールです。",
                    "zh-hans": "Utsuho是一个Python模块，用于在日语中半角片假名和全角片假名之间进行双向转换的工具。",
                    "zh-hant": "Utsuho是一個Python模組，用於在日語中半角片假名和全角片假名之間進行雙向轉換。"
                }
            },
            "https://github.com/Hizuru3/python-habachen": {
                "sub_category": "Preprocessor",
                "repository_name": "python-habachen",
                "user_name": "Hizuru3",
                "description": "Yet Another Fast Japanese String Converter",
                "multilingual_descriptions": {
                    "en": "Yet Another Fast Japanese String Converter",
                    "ja": "もう一つの高速な日本語文字列変換ツール",
                    "zh-hans": "另一个快速的日语字符串转换器",
                    "zh-hant": "另一個快速的日文字串轉換器"
                }
            },
            "https://github.com/bikatr7/kairyou": {
                "sub_category": "Preprocessor",
                "repository_name": "kairyou",
                "user_name": "bikatr7",
                "description": "Quickly preprocesses Japanese text using NLP/NER from SpaCy for Japanese translation or other NLP tasks.",
                "multilingual_descriptions": {
                    "en": "Quickly preprocesses Japanese text using NLP/NER from SpaCy for Japanese translation or other NLP tasks.",
                    "ja": "SpaCyを使用して、日本語テキストをNLP/NERで迅速に前処理し、日本語翻訳やその他のNLPタスクに使用します。",
                    "zh-hans": "使用SpaCy快速预处理日文文本，以便进行日文翻译或其他自然语言处理任务。",
                    "zh-hant": "使用SpaCy快速預處理日文文本，以進行日文翻譯或其他NLP任務。"
                }
            },
            "https://github.com/megagonlabs/bunkai": {
                "sub_category": "Sentence spliter",
                "repository_name": "bunkai",
                "user_name": "megagonlabs",
                "description": "Sentence boundary disambiguation tool for Japanese texts (日本語文境界判定器)",
                "multilingual_descriptions": {
                    "en": "Sentence boundary disambiguation tool for Japanese texts (日本語文境界判定器)",
                    "ja": "日本語テキストの文境界曖昧性解消ツール (日本語文境界判定器)",
                    "zh-hans": "日语文本句子边界消歧工具",
                    "zh-hant": "日本語文境界判定工具"
                }
            },
            "https://github.com/hppRC/japanese-sentence-breaker": {
                "sub_category": "Sentence spliter",
                "repository_name": "japanese-sentence-breaker",
                "user_name": "hppRC",
                "description": "Japanese Sentence Breaker",
                "multilingual_descriptions": {
                    "en": "Japanese Sentence Breaker",
                    "ja": "日本語の文分割器",
                    "zh-hans": "日语句子分割器",
                    "zh-hant": "日本語句子分解器"
                }
            },
            "https://github.com/ikegami-yukino/sengiri": {
                "sub_category": "Sentence spliter",
                "repository_name": "sengiri",
                "user_name": "ikegami-yukino",
                "description": "Yet another sentence-level tokenizer for the Japanese text",
                "multilingual_descriptions": {
                    "en": "Yet another sentence-level tokenizer for the Japanese text",
                    "ja": "日本語テキストのための別の文レベルのトークナイザー",
                    "zh-hans": "又一个用于日语文本的句子级分词器",
                    "zh-hant": "另一個針對日文文本的句子級分詞器"
                }
            },
            "https://github.com/google/budoux": {
                "sub_category": "Sentence spliter",
                "repository_name": "budoux",
                "user_name": "google",
                "description": "Standalone. Small. Language-neutral. BudouX is the successor to Budou, the machine learning powered line break organizer tool.",
                "multilingual_descriptions": {
                    "en": "Standalone. Small. Language-neutral. BudouX is the successor to Budou, the machine learning powered line break organizer tool.",
                    "ja": "スタンドアロン。小さい。言語に依存しない。BudouXは、機械学習による行の整理ツールであるBudouの後継者です。",
                    "zh-hans": "独立的。小巧的。语言中立的。BudouX是机器学习驱动的断行组织工具Budou的继承者。",
                    "zh-hant": "獨立的。小巧的。語言中立的。BudouX 是機器學習驅動的斷行整理工具 Budou 的後繼者。"
                }
            },
            "https://github.com/wwwcojp/ja_sentence_segmenter": {
                "sub_category": "Sentence spliter",
                "repository_name": "ja_sentence_segmenter",
                "user_name": "wwwcojp",
                "description": "japanese sentence segmentation library for python",
                "multilingual_descriptions": {
                    "en": "japanese sentence segmentation library for python",
                    "ja": "Python用の日本語文分割ライブラリ",
                    "zh-hans": "Python的日语句子分割库",
                    "zh-hant": "Python 的日文句子分割程式庫"
                }
            },
            "https://github.com/mkartawijaya/hasami": {
                "sub_category": "Sentence spliter",
                "repository_name": "hasami",
                "user_name": "mkartawijaya",
                "description": "A tool to perform sentence segmentation on Japanese text",
                "multilingual_descriptions": {
                    "en": "A tool to perform sentence segmentation on Japanese text",
                    "ja": "日本語テキストの文分割を実行するツール",
                    "zh-hans": "一个用于对日语文本进行句子分割的工具",
                    "zh-hant": "一個用於對日文文本進行句子分割的工具"
                }
            },
            "https://github.com/alinear-corp/kuzukiri": {
                "sub_category": "Sentence spliter",
                "repository_name": "kuzukiri",
                "user_name": "alinear-corp",
                "description": "Japanese Text Segmenter for Python written in Rust",
                "multilingual_descriptions": {
                    "en": "Japanese Text Segmenter for Python written in Rust",
                    "ja": "Rustで書かれたPython用の日本語テキストセグメンター",
                    "zh-hans": "用Rust编写的Python日语文本分段器",
                    "zh-hant": "用 Rust 編寫的 Python 日文文本分割器"
                }
            },
            "https://github.com/hkiyomaru/ja-senter-benchmark": {
                "sub_category": "Sentence spliter",
                "repository_name": "ja-senter-benchmark",
                "user_name": "hkiyomaru",
                "description": "Comparison of Japanese Sentence Segmentation Tools",
                "multilingual_descriptions": {
                    "en": "Comparison of Japanese Sentence Segmentation Tools",
                    "ja": "日本語文分割ツールの比較",
                    "zh-hans": "日语句子分割工具比较",
                    "zh-hant": "日本語句子分割工具比較"
                }
            },
            "https://github.com/ikegami-yukino/oseti": {
                "sub_category": "Sentiment analysis",
                "repository_name": "oseti",
                "user_name": "ikegami-yukino",
                "description": "Dictionary based Sentiment Analysis for Japanese",
                "multilingual_descriptions": {
                    "en": "Dictionary based Sentiment Analysis for Japanese",
                    "ja": "日本語の辞書ベースの感情分析",
                    "zh-hans": "基于词典的日语情感分析",
                    "zh-hant": "基於詞典的日語情感分析"
                }
            },
            "https://github.com/liaoziyang/negapoji": {
                "sub_category": "Sentiment analysis",
                "repository_name": "negapoji",
                "user_name": "liaoziyang",
                "description": "Japanese negative positive classification.日本語文書のネガポジを判定。",
                "multilingual_descriptions": {
                    "en": "Japanese document sentiment analysis to determine negative or positive.",
                    "ja": "日本語のネガティブ・ポジティブの分類。日本語の文章のネガティブ・ポジティブを判定します。",
                    "zh-hans": "日语文档的负面和正面分类判断。",
                    "zh-hant": "日本語文書的正負面分類。"
                }
            },
            "https://github.com/ikegami-yukino/pymlask": {
                "sub_category": "Sentiment analysis",
                "repository_name": "pymlask",
                "user_name": "ikegami-yukino",
                "description": "Emotion analyzer for Japanese text",
                "multilingual_descriptions": {
                    "en": "Emotion analyzer for Japanese text",
                    "ja": "日本語テキストの感情分析ツール",
                    "zh-hans": "日语文本情感分析器",
                    "zh-hant": "日文文本情感分析器"
                }
            },
            "https://github.com/Hironsan/asari": {
                "sub_category": "Sentiment analysis",
                "repository_name": "asari",
                "user_name": "Hironsan",
                "description": "Japanese sentiment analyzer implemented in Python.",
                "multilingual_descriptions": {
                    "en": "Japanese sentiment analyzer implemented in Python.",
                    "ja": "Pythonで実装された日本語感情分析器。",
                    "zh-hans": "Python实现的日语情感分析器。",
                    "zh-hant": "使用Python實現的日語情感分析器。"
                }
            },
            "https://github.com/MorinoseiMorizo/jparacrawl-finetune": {
                "sub_category": "Machine translation",
                "repository_name": "jparacrawl-finetune",
                "user_name": "MorinoseiMorizo",
                "description": "An example usage of JParaCrawl pre-trained Neural Machine Translation (NMT) models.",
                "multilingual_descriptions": {
                    "en": "An example usage of JParaCrawl pre-trained Neural Machine Translation (NMT) models.",
                    "ja": "JParaCrawlの事前学習済みニューラル機械翻訳（NMT）モデルの使用例。",
                    "zh-hans": "JParaCrawl预训练神经机器翻译（NMT）模型的示例用法。",
                    "zh-hant": "JParaCrawl 預訓練神經機器翻譯 (NMT) 模型的使用示例。"
                }
            },
            "https://github.com/Mao-KU/JASS": {
                "sub_category": "Machine translation",
                "repository_name": "JASS",
                "user_name": "Mao-KU",
                "description": "JASS: Japanese-specific Sequence to Sequence Pre-training for Neural Machine Translation (LREC2020) & Linguistically Driven Multi-Task Pre-Training for Low-Resource Neural Machine Translation (ACM TALLIP)",
                "multilingual_descriptions": {
                    "en": "JASS: Japanese-specific Sequence to Sequence Pre-training for Neural Machine Translation (LREC2020) & Linguistically Driven Multi-Task Pre-Training for Low-Resource Neural Machine Translation (ACM TALLIP)",
                    "ja": "JASS：ニューラル機械翻訳のための日本語固有のシーケンス・トゥ・シーケンス事前学習（LREC2020）＆言語学的に駆動された低リソースニューラル機械翻訳のためのマルチタスク事前学習（ACM TALLIP）",
                    "zh-hans": "JASS：面向神经机器翻译的日语特定序列到序列预训练（LREC2020）和面向低资源神经机器翻译的语言学驱动多任务预训练（ACM TALLIP）。",
                    "zh-hant": "JASS：針對日本特定序列的序列到序列預訓練，用於神經機器翻譯（LREC2020）和基於語言學的多任務預訓練，用於低資源神經機器翻譯（ACM TALLIP）。"
                }
            },
            "https://github.com/cl-tohoku/PheMT": {
                "sub_category": "Machine translation",
                "repository_name": "PheMT",
                "user_name": "cl-tohoku",
                "description": "A phenomenon-wise evaluation dataset for Japanese-English machine translation robustness. The dataset is based on the MTNT dataset, with additional annotations of four linguistic phenomena; Proper Noun, Abbreviated Noun, Colloquial Expression, and Variant. COLING 2020.",
                "multilingual_descriptions": {
                    "en": "A phenomenon-wise evaluation dataset for Japanese-English machine translation robustness. The dataset is based on the MTNT dataset, with additional annotations of four linguistic phenomena; Proper Noun, Abbreviated Noun, Colloquial Expression, and Variant. COLING 2020.",
                    "ja": "日英機械翻訳の堅牢性に関する現象別評価データセット。このデータセットは、MTNTデータセットをベースに、固有名詞、略語、口語表現、および変異形の4つの言語現象の追加注釈を含んでいます。COLING 2020。",
                    "zh-hans": "一份针对日英机器翻译鲁棒性的现象级评估数据集。该数据集基于MTNT数据集，额外注释了四种语言现象：专有名词、缩写名词、口语表达和变体。COLING 2020。",
                    "zh-hant": "一個針對日英機器翻譯韌性的現象級評估數據集。該數據集基於MTNT數據集，並附加了四種語言現象的註釋；專有名詞、縮寫名詞、口語表達和變體。COLING 2020。"
                }
            },
            "https://github.com/ku-nlp/VISA": {
                "sub_category": "Machine translation",
                "repository_name": "VISA",
                "user_name": "ku-nlp",
                "description": "An ambiguous subtitles dataset for visual scene-aware machine translation",
                "multilingual_descriptions": {
                    "en": "An ambiguous subtitles dataset for visual scene-aware machine translation",
                    "ja": "視覚シーンに関する機械翻訳のための曖昧な字幕データセット",
                    "zh-hans": "一份用于视觉场景感知机器翻译的模糊字幕数据集",
                    "zh-hant": "一個用於視覺場景感知機器翻譯的模糊字幕數據集"
                }
            },
            "https://github.com/chakki-works/namaco": {
                "sub_category": "Named entity recognition",
                "repository_name": "namaco",
                "user_name": "chakki-works",
                "description": "Character Based Named Entity Recognition.",
                "multilingual_descriptions": {
                    "en": "Character Based Named Entity Recognition.",
                    "ja": "文字ベースの固有表現認識。",
                    "zh-hans": "基于字符的命名实体识别。",
                    "zh-hant": "基於字元的命名實體識別。"
                }
            },
            "https://github.com/chakki-works/entitypedia": {
                "sub_category": "Named entity recognition",
                "repository_name": "entitypedia",
                "user_name": "chakki-works",
                "description": "Entitypedia is an Extended Named Entity Dictionary from Wikipedia.",
                "multilingual_descriptions": {
                    "en": "Entitypedia is an Extended Named Entity Dictionary from Wikipedia.",
                    "ja": "Entitypediaは、Wikipediaからの拡張された固有名詞辞書です。",
                    "zh-hans": "Entitypedia是来自维基百科的扩展命名实体词典。",
                    "zh-hant": "Entitypedia是一個從維基百科擴展出來的命名實體詞典。"
                }
            },
            "https://github.com/ken11/noyaki": {
                "sub_category": "Named entity recognition",
                "repository_name": "noyaki",
                "user_name": "ken11",
                "description": "Converts character span label information to tokenized text-based label information.",
                "multilingual_descriptions": {
                    "en": "Converts character span label information to tokenized text-based label information.",
                    "ja": "文字の範囲ラベル情報をトークン化されたテキストベースのラベル情報に変換します。",
                    "zh-hans": "将字符跨度标签信息转换为基于分词文本的标签信息。",
                    "zh-hant": "將字符跨度標籤信息轉換為基於分詞文本的標籤信息。"
                }
            },
            "https://github.com/ken11/bert-japanese-ner-finetuning": {
                "sub_category": "Named entity recognition",
                "repository_name": "bert-japanese-ner-finetuning",
                "user_name": "ken11",
                "description": "Code to perform finetuning of the BERT model. BERTモデルのファインチューニングで固有表現抽出用タスクのモデルを作成・使用するサンプルです",
                "multilingual_descriptions": {
                    "en": "This is a sample code for creating and using a model for named entity recognition task through finetuning of the BERT model.",
                    "ja": "BERTモデルのファインチューニングを行うコード。BERTモデルのファインチューニングで固有表現抽出用タスクのモデルを作成・使用するサンプルです",
                    "zh-hans": "用于BERT模型微调的代码。这是一个用于创建和使用用于命名实体识别任务的模型的示例。",
                    "zh-hant": "用於BERT模型微調的代碼。這是用於創建和使用用於實體識別任務的模型的BERT模型微調示例。"
                }
            },
            "https://github.com/aih-uth/joint-information-extraction-hs": {
                "sub_category": "Named entity recognition",
                "repository_name": "joint-information-extraction-hs",
                "user_name": "aih-uth",
                "description": "詳細なアノテーション基準に基づく症例報告コーパスからの固有表現及び関係の抽出精度の推論を行うコード",
                "multilingual_descriptions": {
                    "en": "Code for inferring the accuracy of named entity and relation extraction from a case report corpus based on detailed annotation criteria.",
                    "ja": "詳細なアノテーション基準に基づく症例報告コーパスからの固有表現及び関係の抽出精度の推論を行うコード",
                    "zh-hans": "基于详细的注释标准的病例报告语料库，进行实体和关系抽取精度推理的代码。",
                    "zh-hant": "從基於詳細註釋標準的病例報告語料庫中進行固有表達和關係抽取精度推論的代碼。"
                }
            },
            "https://github.com/geonlp-platform/pygeonlp": {
                "sub_category": "Named entity recognition",
                "repository_name": "pygeonlp",
                "user_name": "geonlp-platform",
                "description": "pygeonlp, A python module for geotagging Japanese texts.",
                "multilingual_descriptions": {
                    "en": "pygeonlp, A python module for geotagging Japanese texts.",
                    "ja": "pygeonlpは、日本語テキストのジオタギングに使用するPythonモジュールです。",
                    "zh-hans": "pygeonlp，一个用于对日语文本进行地理标记的Python模块。",
                    "zh-hant": "pygeonlp，一個用於對日文文本進行地理標記的Python模塊。"
                }
            },
            "https://github.com/jurabiinc/bert-ner-japanese": {
                "sub_category": "Named entity recognition",
                "repository_name": "bert-ner-japanese",
                "user_name": "jurabiinc",
                "description": "BERTによる日本語固有表現抽出のファインチューニング用プログラム",
                "multilingual_descriptions": {
                    "en": "Program for fine-tuning Japanese named entity recognition using BERT",
                    "ja": "BERTによる日本語固有表現抽出のファインチューニング用プログラム",
                    "zh-hans": "使用BERT进行日语命名实体抽取的微调程序",
                    "zh-hant": "BERT進行日語固有表現抽取的微調程式"
                }
            },
            "https://github.com/tsmatz/huggingface-finetune-japanese": {
                "sub_category": "Named entity recognition",
                "repository_name": "huggingface-finetune-japanese",
                "user_name": "tsmatz",
                "description": "Examples to finetune encoder-only and encoder-decoder transformers for Japanese language (Hugging Face) Resources",
                "multilingual_descriptions": {
                    "en": "Examples to finetune encoder-only and encoder-decoder transformers for Japanese language (Hugging Face) Resources",
                    "ja": "日本語の言語（Hugging Face）リソースのためにエンコーダーのみとエンコーダーデコーダーのトランスフォーマーを微調整するための例",
                    "zh-hans": "针对日语微调仅编码器和编码器-解码器Transformer的示例（Hugging Face）资源",
                    "zh-hant": "針對日語微調僅編碼器和編碼器-解碼器Transformer的示例（Hugging Face）資源"
                }
            },
            "https://github.com/kha-white/manga-ocr": {
                "sub_category": "OCR",
                "repository_name": "manga-ocr",
                "user_name": "kha-white",
                "description": "About Optical character recognition for Japanese text, with the main focus being Japanese manga",
                "multilingual_descriptions": {
                    "en": "About Optical character recognition for Japanese text, with the main focus being Japanese manga",
                    "ja": "日本語のマンガを主な対象とした、日本語テキストの光学文字認識。",
                    "zh-hans": "关于日文文本的光学字符识别，主要关注于日本漫画。",
                    "zh-hant": "關於日文文字的光學字符識別，主要聚焦於日本漫畫。"
                }
            },
            "https://github.com/kha-white/mokuro": {
                "sub_category": "OCR",
                "repository_name": "mokuro",
                "user_name": "kha-white",
                "description": "Read Japanese manga inside browser with selectable text.",
                "multilingual_descriptions": {
                    "en": "Read Japanese manga inside browser with selectable text.",
                    "ja": "ブラウザ内で選択可能なテキストで日本のマンガを読む。",
                    "zh-hans": "在浏览器中阅读日本漫画，可选择文本。",
                    "zh-hant": "在瀏覽器中閱讀日本漫畫，並可選擇文字。"
                }
            },
            "https://github.com/yas-sim/handwritten-japanese-ocr": {
                "sub_category": "OCR",
                "repository_name": "handwritten-japanese-ocr",
                "user_name": "yas-sim",
                "description": "Handwritten Japanese OCR demo using touch panel to draw the input text using Intel OpenVINO toolkit",
                "multilingual_descriptions": {
                    "en": "Handwritten Japanese OCR demo using touch panel to draw the input text using Intel OpenVINO toolkit",
                    "ja": "インテルのOpenVINOツールキットを使用して、タッチパネルを使って入力テキストを描画する手書き日本語OCRデモ",
                    "zh-hans": "使用Intel OpenVINO工具包，通过触摸面板绘制输入文本的手写日语OCR演示。",
                    "zh-hant": "手寫日文OCR演示，使用觸控面板繪製輸入文本，使用Intel OpenVINO工具包。"
                }
            },
            "https://github.com/tanreinama/OCR_Japanease": {
                "sub_category": "OCR",
                "repository_name": "OCR_Japanease",
                "user_name": "tanreinama",
                "description": "日本語OCR",
                "multilingual_descriptions": {
                    "en": "Japanese OCR",
                    "ja": "日本語OCR",
                    "zh-hans": "日语OCR",
                    "zh-hant": "日本語OCR"
                }
            },
            "https://github.com/ndl-lab/ndlocr_cli": {
                "sub_category": "OCR",
                "repository_name": "ndlocr_cli",
                "user_name": "ndl-lab",
                "description": "NDLOCRのアプリケーション",
                "multilingual_descriptions": {
                    "en": "NDLOCR application",
                    "ja": "NDLOCRのアプリケーション",
                    "zh-hans": "NDLOCR应用程序",
                    "zh-hant": "NDLOCR的應用程式"
                }
            },
            "https://github.com/clovaai/donut": {
                "sub_category": "OCR",
                "repository_name": "donut",
                "user_name": "clovaai",
                "description": "Official Implementation of OCR-free Document Understanding Transformer (Donut) and Synthetic Document Generator (SynthDoG), ECCV 2022",
                "multilingual_descriptions": {
                    "en": "Official Implementation of OCR-free Document Understanding Transformer (Donut) and Synthetic Document Generator (SynthDoG), ECCV 2022",
                    "ja": "OCRフリー文書理解トランスフォーマー（Donut）および合成文書ジェネレーター（SynthDoG）の公式実装、ECCV 2022",
                    "zh-hans": "OCR-free文档理解Transformer（Donut）和合成文档生成器（SynthDoG）的官方实现，ECCV 2022",
                    "zh-hant": "OCR-free文件理解轉換器（Donut）和合成文件生成器（SynthDoG）的官方實施，ECCV 2022"
                }
            },
            "https://github.com/ttop32/JMTrans": {
                "sub_category": "OCR",
                "repository_name": "JMTrans",
                "user_name": "ttop32",
                "description": "get japanese manga from url to translate manga image",
                "multilingual_descriptions": {
                    "en": "Manga translator - retrieve Japanese manga from URL to translate manga images.",
                    "ja": "マンガ翻訳者 - URLから日本のマンガを取得してマンガ画像を翻訳する",
                    "zh-hans": "漫画翻译器 - 从网址获取日本漫画以翻译漫画图像",
                    "zh-hant": "漫畫翻譯器 - 從網址獲取日本漫畫以翻譯漫畫圖像"
                }
            },
            "https://github.com/ducanh841988/Kindai-OCR": {
                "sub_category": "OCR",
                "repository_name": "Kindai-OCR",
                "user_name": "ducanh841988",
                "description": "OCR system for recognizing modern Japanese magazines",
                "multilingual_descriptions": {
                    "en": "OCR system for recognizing modern Japanese magazines",
                    "ja": "現代日本の雑誌を認識するOCRシステム",
                    "zh-hans": "用于识别现代日本杂志的OCR系统",
                    "zh-hant": "識別現代日本雜誌的OCR系統"
                }
            },
            "https://github.com/ndl-lab/text_recognition": {
                "sub_category": "OCR",
                "repository_name": "text_recognition",
                "user_name": "ndl-lab",
                "description": "NDLOCR用テキスト認識モジュール",
                "multilingual_descriptions": {
                    "en": "Text recognition module for NDLOCR.",
                    "ja": "NDLOCR用テキスト認識モジュール",
                    "zh-hans": "NDLOCR文本识别模块",
                    "zh-hant": "NDLOCR使用文字識別模組"
                }
            },
            "https://github.com/blueaxis/Poricom": {
                "sub_category": "OCR",
                "repository_name": "Poricom",
                "user_name": "blueaxis",
                "description": "Optical character recognition in manga images. Manga OCR desktop application",
                "multilingual_descriptions": {
                    "en": "Optical character recognition in manga images. Manga OCR desktop application",
                    "ja": "漫画画像の光学文字認識。漫画OCRデスクトップアプリケーション。",
                    "zh-hans": "漫画图像的光学字符识别。漫画OCR桌面应用程序。",
                    "zh-hant": "漫畫圖像的光學字符識別。漫畫OCR桌面應用程式。"
                }
            },
            "https://github.com/aurorawright/owocr": {
                "sub_category": "OCR",
                "repository_name": "owocr",
                "user_name": "aurorawright",
                "description": "Optical character recognition for Japanese text",
                "multilingual_descriptions": {
                    "en": "Optical character recognition for Japanese text",
                    "ja": "日本語テキストの光学文字認識",
                    "zh-hans": "日文文本的光学字符识别",
                    "zh-hant": "日文文本的光學字符識別"
                }
            },
            "https://github.com/kotaro-kinoshita/yomitoku": {
                "sub_category": "OCR",
                "repository_name": "yomitoku",
                "user_name": "kotaro-kinoshita",
                "description": "Yomitoku is an AI-powered document image analysis package designed specifically for the Japanese language.",
                "multilingual_descriptions": {
                    "en": "Yomitoku is an AI-powered document image analysis package designed specifically for the Japanese language.",
                    "ja": "Yomitokuは、日本語に特化したAIパワードのドキュメント画像解析パッケージです。",
                    "zh-hans": "Yomitoku是一款由人工智能驱动的文件图像分析软件包，专门为日语设计。",
                    "zh-hant": "Yomitoku是一個專為日語設計的AI驅動的文件圖像分析套件。"
                }
            },
            "https://github.com/lithium0003/findtextcenternet": {
                "sub_category": "OCR",
                "repository_name": "findtextcenternet",
                "user_name": "lithium0003",
                "description": "Japanese OCR with CenterNet",
                "multilingual_descriptions": {
                    "en": "Japanese OCR with CenterNet",
                    "ja": "CenterNetを使用した日本語OCR",
                    "zh-hans": "使用CenterNet的日语OCR",
                    "zh-hant": "使用CenterNet的日文OCR"
                }
            },
            "https://github.com/yahoojapan/JGLUE": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "JGLUE",
                "user_name": "yahoojapan",
                "description": "JGLUE: Japanese General Language Understanding Evaluation",
                "multilingual_descriptions": {
                    "en": "JGLUE: Japanese General Language Understanding Evaluation",
                    "ja": "JGLUE：日本語一般言語理解評価",
                    "zh-hans": "JGLUE：日本通用语言理解评估",
                    "zh-hant": "JGLUE：日本通用語言理解評估"
                }
            },
            "https://github.com/megagonlabs/ginza-transformers": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "ginza-transformers",
                "user_name": "megagonlabs",
                "description": "Use custom tokenizers in spacy-transformers",
                "multilingual_descriptions": {
                    "en": "Use custom tokenizers in spacy-transformers",
                    "ja": "spacy-transformersでカスタムトークナイザーを使用する",
                    "zh-hans": "在spacy-transformers中使用自定义分词器",
                    "zh-hant": "在spacy-transformers中使用自定義分詞器"
                }
            },
            "https://github.com/Jinyamyzk/t5_japanese_dialogue_generation": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "t5_japanese_dialogue_generation",
                "user_name": "Jinyamyzk",
                "description": "T5による会話生成",
                "multilingual_descriptions": {
                    "en": "Conversation generation using T5.",
                    "ja": "T5による会話生成",
                    "zh-hans": "使用T5生成对话",
                    "zh-hant": "使用T5生成對話"
                }
            },
            "https://github.com/Masao-Taketani/japanese_text_classification": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "japanese_text_classification",
                "user_name": "Masao-Taketani",
                "description": "To investigate various DNN text classifiers including MLP, CNN, RNN, BERT approaches.",
                "multilingual_descriptions": {
                    "en": "To investigate various DNN text classifiers including MLP, CNN, RNN, BERT approaches.",
                    "ja": "MLP、CNN、RNN、BERTアプローチを含む様々なDNNテキスト分類器を調査する。",
                    "zh-hans": "调查各种DNN文本分类器，包括MLP、CNN、RNN、BERT方法。",
                    "zh-hant": "調查各種DNN文本分類器，包括MLP、CNN、RNN、BERT方法。"
                }
            },
            "https://github.com/izuna385/Japanese-BERT-Sentiment-Analyzer": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "Japanese-BERT-Sentiment-Analyzer",
                "user_name": "izuna385",
                "description": "Deploying sentiment analysis server with FastAPI and BERT",
                "multilingual_descriptions": {
                    "en": "Deploying sentiment analysis server with FastAPI and BERT",
                    "ja": "FastAPIとBERTを使用して感情分析サーバーを展開する",
                    "zh-hans": "使用FastAPI和BERT部署情感分析服务器",
                    "zh-hant": "使用FastAPI和BERT部署情感分析伺服器"
                }
            },
            "https://github.com/minhpqn/jmlm_scoring": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "jmlm_scoring",
                "user_name": "minhpqn",
                "description": "Masked Language Model-based Scoring for Japanese and Vietnamese",
                "multilingual_descriptions": {
                    "en": "Masked Language Model-based Scoring for Japanese and Vietnamese",
                    "ja": "日本語とベトナム語のためのマスクされた言語モデルに基づくスコアリング",
                    "zh-hans": "基于掩码语言模型的日语和越南语评分",
                    "zh-hant": "基於遮蔽語言模型的日語和越南語評分"
                }
            },
            "https://github.com/shunk031/allennlp-shiba-model": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "allennlp-shiba-model",
                "user_name": "shunk031",
                "description": "AllenNLP integration for Shiba: Japanese CANINE model",
                "multilingual_descriptions": {
                    "en": "AllenNLP integration for Shiba: Japanese CANINE model",
                    "ja": "ShibaのためのAllenNLP統合：日本のCANINEモデル",
                    "zh-hans": "Shiba的AllenNLP集成：日本CANINE模型",
                    "zh-hant": "Shiba 的 AllenNLP 整合：日本 CANINE 模型"
                }
            },
            "https://github.com/shihono/evaluate_japanese_w2v": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "evaluate_japanese_w2v",
                "user_name": "shihono",
                "description": "script to evaluate pre-trained Japanese word2vec model on Japanese similarity dataset",
                "multilingual_descriptions": {
                    "en": "script to evaluate pre-trained Japanese word2vec model on Japanese similarity dataset",
                    "ja": "日本語の類似度データセットで事前学習された日本語word2vecモデルを評価するスクリプト",
                    "zh-hans": "用于评估预训练的日语word2vec模型在日语相似性数据集上的脚本",
                    "zh-hant": "用於評估預先訓練的日語word2vec模型的日語相似性數據集腳本"
                }
            },
            "https://github.com/jonnyli1125/gector-ja": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "gector-ja",
                "user_name": "jonnyli1125",
                "description": "BERT-based GEC tagging for Japanese",
                "multilingual_descriptions": {
                    "en": "BERT-based GEC tagging for Japanese",
                    "ja": "日本語のBERTベースのGECタグ付け",
                    "zh-hans": "基于BERT的日语GEC标记",
                    "zh-hant": "基於BERT的日語GEC標記"
                }
            },
            "https://github.com/tanreinama/Japanese-BPEEncoder": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "Japanese-BPEEncoder",
                "user_name": "tanreinama",
                "description": "Japanese-BPEEncoder",
                "multilingual_descriptions": {
                    "en": "日本語-BPEエンコーダー",
                    "ja": "日本語-BPEエンコーダー",
                    "zh-hans": "日语-BPE编码器",
                    "zh-hant": "日本語-BPE編碼器"
                }
            },
            "https://github.com/tanreinama/Japanese-BPEEncoder_V2": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "Japanese-BPEEncoder_V2",
                "user_name": "tanreinama",
                "description": "Japanese-BPEEncoder Version 2",
                "multilingual_descriptions": {
                    "en": "Japanese-BPEEncoder Version 2",
                    "ja": "日本語-BPEエンコーダー バージョン2",
                    "zh-hans": "日语-BPE编码器版本2",
                    "zh-hant": "日本語-BPE編碼器版本2"
                }
            },
            "https://github.com/youichiro/transformer-copy": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "transformer-copy",
                "user_name": "youichiro",
                "description": "日本語文法誤り訂正ツール",
                "multilingual_descriptions": {
                    "en": "Japanese grammar error correction tool",
                    "ja": "日本語文法誤り訂正ツール",
                    "zh-hans": "日语语法错误校正工具",
                    "zh-hant": "日本語文法錯誤訂正工具"
                }
            },
            "https://github.com/rinnakk/japanese-stable-diffusion": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "japanese-stable-diffusion",
                "user_name": "rinnakk",
                "description": "Japanese Stable Diffusion is a Japanese specific latent text-to-image diffusion model capable of generating photo-realistic images given any text input.",
                "multilingual_descriptions": {
                    "en": "Japanese Stable Diffusion is a Japanese specific latent text-to-image diffusion model capable of generating photo-realistic images given any text input.",
                    "ja": "日本語ステーブル拡散は、任意のテキスト入力に対して写真のようなリアルな画像を生成することができる、日本特有の潜在的なテキストから画像への拡散モデルです。",
                    "zh-hans": "日本稳定扩散是一种日本特有的潜在文本到图像扩散模型，能够根据任何文本输入生成逼真的照片。",
                    "zh-hant": "日本穩定擴散是一種日本特有的潛在文本到圖像擴散模型，能夠生成逼真的照片般的圖像，並接受任何文本輸入。"
                }
            },
            "https://github.com/taishi-i/nagisa_bert": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "nagisa_bert",
                "user_name": "taishi-i",
                "description": "A BERT model for nagisa",
                "multilingual_descriptions": {
                    "en": "A BERT model for Nagisa.",
                    "ja": "nagisa用のBERTモデル",
                    "zh-hans": "一个用于nagisa的BERT模型",
                    "zh-hant": "一個針對nagisa的BERT模型"
                }
            },
            "https://github.com/rinnakk/prefix-tuning-gpt": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "prefix-tuning-gpt",
                "user_name": "rinnakk",
                "description": "Example code for prefix-tuning GPT/GPT-NeoX models and for inference with trained prefixes",
                "multilingual_descriptions": {
                    "en": "Example code for prefix-tuning GPT/GPT-NeoX models and for inference with trained prefixes",
                    "ja": "トレーニング済みのプレフィックスを使用したGPT/GPT-NeoXモデルのプレフィックスチューニングの例コードと推論のためのコード。",
                    "zh-hans": "用于前缀调整GPT/GPT-NeoX模型的示例代码以及使用训练好的前缀进行推理的代码。",
                    "zh-hant": "前綴調整 GPT/GPT-NeoX 模型的範例代碼以及使用訓練過的前綴進行推論的代碼。"
                }
            },
            "https://github.com/nobu-g/JGLUE-benchmark": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "JGLUE-benchmark",
                "user_name": "nobu-g",
                "description": "Training and evaluation scripts for JGLUE, a Japanese language understanding benchmark",
                "multilingual_descriptions": {
                    "en": "Training and evaluation scripts for JGLUE, a Japanese language understanding benchmark",
                    "ja": "JGLUEのトレーニングと評価スクリプト、日本語理解ベンチマーク用",
                    "zh-hans": "JGLUE的训练和评估脚本，是一个日语理解基准测试。",
                    "zh-hant": "JGLUE的訓練和評估腳本，這是一個日語理解基準測試。"
                }
            },
            "https://github.com/retarfi/jptranstokenizer": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "jptranstokenizer",
                "user_name": "retarfi",
                "description": "Japanese Tokenizer for transformers library",
                "multilingual_descriptions": {
                    "en": "日本語のトークナイザー（分かち書きツール）をTransformersライブラリ用に作成しました。",
                    "ja": "トランスフォーマーライブラリの日本語トークナイザー",
                    "zh-hans": "Transformers库的日语分词器",
                    "zh-hant": "Transformers 库的日语分词器"
                }
            },
            "https://github.com/Stability-AI/lm-evaluation-harness/tree/jp-stable": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "jp-stable",
                "user_name": "tree",
                "description": "JP Language Model Evaluation Harness",
                "multilingual_descriptions": {
                    "en": "JP Language Model Evaluation Harness",
                    "ja": "JP言語モデル評価ハーネス",
                    "zh-hans": "JP语言模型评估工具",
                    "zh-hant": "JP 語言模型評估工具"
                }
            },
            "https://github.com/hitachi-nlp/compare-ja-tokenizer": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "compare-ja-tokenizer",
                "user_name": "hitachi-nlp",
                "description": "How do different tokenizers perform on downstream tasks in scriptio continua languages?: A case study in Japanese-ACL SRW 2023",
                "multilingual_descriptions": {
                    "en": "How do different tokenizers perform on downstream tasks in scriptio continua languages?: A case study in Japanese - ACL SRW 2023",
                    "ja": "異なるトークナイザーは、スクリプト連続言語における下流タスクでどのように機能するか？：日本語のケーススタディ - ACL SRW 2023",
                    "zh-hans": "不同的分词器在连续书写语言的下游任务中表现如何？：以日语为例的案例研究 - ACL SRW 2023",
                    "zh-hant": "不同的分詞器在連續書寫語言的下游任務中表現如何？：以日語為例的案例研究 - ACL SRW 2023"
                }
            },
            "https://github.com/tdc-yamada-ya/lm-evaluation-harness-jp-stable": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "lm-evaluation-harness-jp-stable",
                "user_name": "tdc-yamada-ya",
                "description": "A framework for few-shot evaluation of autoregressive language models.",
                "multilingual_descriptions": {
                    "en": "A framework for few-shot evaluation of autoregressive language models.",
                    "ja": "自己回帰言語モデルの少数ショット評価のためのフレームワーク。",
                    "zh-hans": "一个用于自回归语言模型少样本评估的框架。",
                    "zh-hant": "一個用於少樣本評估自回歸語言模型的框架。"
                }
            },
            "https://github.com/hppRC/llm-lora-classification": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "llm-lora-classification",
                "user_name": "hppRC",
                "description": "llm-lora-classification",
                "multilingual_descriptions": {
                    "en": "llm-lora-classification",
                    "ja": "llm-lora-classification\nllm-lora-分類",
                    "zh-hans": "llm-lora-classification\nllm-lora-分类",
                    "zh-hant": "llm-lora-classification"
                }
            },
            "https://github.com/yukaryavka/rinna_gpt-neox_ggml-lora": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "rinna_gpt-neox_ggml-lora",
                "user_name": "yukaryavka",
                "description": "The repository contains scripts and merge scripts that have been modified to adapt an Alpaca-Lora adapter for LoRA tuning when assuming the use of the \"rinna/japanese-gpt-neox...\" [gpt-neox] model converted to ggml.",
                "multilingual_descriptions": {
                    "en": "The repository contains scripts and merge scripts that have been modified to adapt an Alpaca-Lora adapter for LoRA tuning when assuming the use of the \"rinna/japanese-gpt-neox...\" [gpt-neox] model converted to ggml.",
                    "ja": "このリポジトリには、\"rinna/japanese-gpt-neox...\" [gpt-neox] モデルをggmlに変換した場合に、Alpaca-LoraアダプターをLoRAチューニングに適応させるために修正されたスクリプトとマージスクリプトが含まれています。",
                    "zh-hans": "该存储库包含已修改的脚本和合并脚本，用于适应Alpaca-Lora适配器的LoRA调谐，假设使用转换为ggml的\"gpt-neox\"模型的\"rinna/japanese-gpt-neox...\"。\n该存储库包含已修改的脚本和合并脚本，用于适应Alpaca-Lora适配器的LoRA调谐，假设使用转换为ggml的\"gpt-neox\"模型的\"rinna/japanese-gpt-neox...\"。",
                    "zh-hant": "該存儲庫包含已修改的腳本和合併腳本，用於將Alpaca-Lora適配器調整為支持LoRA調諧，假設使用了“rinna/japanese-gpt-neox...” [gpt-neox]模型轉換為ggml。"
                }
            },
            "https://github.com/oshizo/japanese-llm-roleplay-benchmark": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "japanese-llm-roleplay-benchmark",
                "user_name": "oshizo",
                "description": "このリポジトリは日本語LLMのキャラクターロールプレイに関する性能を評価するために作成しました。",
                "multilingual_descriptions": {
                    "en": "This repository was created to evaluate the performance of character role-playing in Japanese LLM.",
                    "ja": "このリポジトリは日本語LLMのキャラクターロールプレイに関する性能を評価するために作成しました。",
                    "zh-hans": "这个存储库是为了评估日本语LLM角色扮演的性能而创建的。",
                    "zh-hant": "這個存儲庫是為了評估日本語LLM的角色扮演性能而創建的。"
                }
            },
            "https://github.com/yuzu-ai/japanese-llm-ranking": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "japanese-llm-ranking",
                "user_name": "yuzu-ai",
                "description": "This repository supports YuzuAI's Rakuda leaderboard of Japanese LLMs, which is a Japanese-focused analogue of LMSYS' Vicuna eval.",
                "multilingual_descriptions": {
                    "en": "This repository supports YuzuAI's Rakuda leaderboard of Japanese LLMs, which is a Japanese-focused analogue of LMSYS' Vicuna eval.",
                    "ja": "このリポジトリは、YuzuAIのラクダリーダーボードをサポートしています。ラクダリーダーボードは、LMSYSのビクーナ評価の日本に特化した類似物です。",
                    "zh-hans": "该存储库支持YuzuAI的Rakuda排行榜，该排行榜是日本LLMs的日本重点模拟版本，类似于LMSYS的Vicuna评估。",
                    "zh-hant": "這個儲存庫支援YuzuAI的Rakuda排行榜，該排行榜是日本語言模型的日本專用版本，類似於LMSYS的Vicuna評估。"
                }
            },
            "https://github.com/llm-jp/llm-jp-eval": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "llm-jp-eval",
                "user_name": "llm-jp",
                "description": "このツールは、複数のデータセットを横断して日本語の大規模言語モデルを自動評価するものです．",
                "multilingual_descriptions": {
                    "en": "This tool is designed to automatically evaluate large-scale Japanese language models across multiple datasets.",
                    "ja": "このツールは、複数のデータセットを横断して日本語の大規模言語モデルを自動評価するものです．",
                    "zh-hans": "这个工具可以跨多个数据集对日语大规模语言模型进行自动评估。",
                    "zh-hant": "這個工具可以跨多個數據集對日語大規模語言模型進行自動評估。"
                }
            },
            "https://github.com/llm-jp/llm-jp-sft": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "llm-jp-sft",
                "user_name": "llm-jp",
                "description": "This repository contains the code for supervised fine-tuning of LLM-jp models.",
                "multilingual_descriptions": {
                    "en": "This repository contains the code for supervised fine-tuning of LLM-jp models.",
                    "ja": "このリポジトリには、LLM-jpモデルの教師ありファインチューニングのためのコードが含まれています。",
                    "zh-hans": "该存储库包含了LLM-jp模型的监督微调代码。",
                    "zh-hant": "此存儲庫包含了LLM-jp模型的監督微調代碼。"
                }
            },
            "https://github.com/llm-jp/llm-jp-tokenizer": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "llm-jp-tokenizer",
                "user_name": "llm-jp",
                "description": "LLM勉強会（LLM-jp）で開発しているLLM用のトークナイザー関連をまとめたリポジトリです．",
                "multilingual_descriptions": {
                    "en": "This is a repository that summarizes the tokenizer related to LLM being developed at the LLM Study Group (LLM-jp).",
                    "ja": "LLM勉強会（LLM-jp）で開発しているLLM用のトークナイザー関連をまとめたリポジトリです．",
                    "zh-hans": "这是一个整理了在LLM勉强会（LLM-jp）中开发的与LLM的分词器相关的存储库。",
                    "zh-hant": "這是一個整理了在LLM勉強會（LLM-jp）中開發的與LLM用戶端相關的分詞器的存儲庫。"
                }
            },
            "https://github.com/pfnet-research/japanese-lm-fin-harness": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "japanese-lm-fin-harness",
                "user_name": "pfnet-research",
                "description": "Japanese Language Model Financial Evaluation Harness",
                "multilingual_descriptions": {
                    "en": "日本語言模型金融评估工具",
                    "ja": "日本語言語モデルの金融評価ハーネス",
                    "zh-hans": "日语语言模型金融评估工具",
                    "zh-hant": "日語語言模型金融評估工具"
                }
            },
            "https://github.com/ku-nlp/ja-vicuna-qa-benchmark": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "ja-vicuna-qa-benchmark",
                "user_name": "ku-nlp",
                "description": "Japanese Vicuna QA Benchmark",
                "multilingual_descriptions": {
                    "en": "Japanese Vicuna QA Benchmark",
                    "ja": "日本のビクーニャQAベンチマーク",
                    "zh-hans": "日本维库纳问答基准",
                    "zh-hant": "日本維卡尼亞QA基準"
                }
            },
            "https://github.com/swallow-llm/swallow-evaluation": {
                "sub_category": "Tool for pretrained models",
                "repository_name": "swallow-evaluation",
                "user_name": "swallow-llm",
                "description": "Swallowプロジェクト 大規模言語モデル 評価スクリプト",
                "multilingual_descriptions": {
                    "en": "Swallow Project Large-Scale Language Model Evaluation Script",
                    "ja": "Swallowプロジェクト 大規模言語モデル 評価スクリプト",
                    "zh-hans": "燕子项目 大规模语言模型 评估脚本",
                    "zh-hant": "燕子項目 大規模語言模型 評估腳本"
                }
            },
            "https://github.com/rskmoi/namedivider-python": {
                "sub_category": null,
                "repository_name": "namedivider-python",
                "user_name": "rskmoi",
                "description": "A tool for dividing the Japanese full name into a family name and a given name.",
                "multilingual_descriptions": {
                    "en": "A tool for dividing the Japanese full name into a family name and a given name.",
                    "ja": "日本のフルネームを姓と名に分けるためのツール。",
                    "zh-hans": "一个将日本全名分成姓和名的工具。",
                    "zh-hant": "一個將日本全名分為姓氏和名字的工具。"
                }
            },
            "https://github.com/ikegami-yukino/asa-python": {
                "sub_category": null,
                "repository_name": "asa-python",
                "user_name": "ikegami-yukino",
                "description": "A curated list of resources dedicated to Python libraries of NLP for Japanese",
                "multilingual_descriptions": {
                    "en": "A curated list of resources dedicated to Python libraries of NLP for Japanese",
                    "ja": "日本語の自然言語処理のPythonライブラリに特化したリソースの厳選リスト",
                    "zh-hans": "一个精选的资源列表，专门介绍用于日语自然语言处理的Python库。",
                    "zh-hant": "一個精選的資源清單，專門為日語自然語言處理的Python庫而設。"
                }
            },
            "https://github.com/Takeuchi-Lab-LM/python_asa": {
                "sub_category": null,
                "repository_name": "python_asa",
                "user_name": "Takeuchi-Lab-LM",
                "description": "python版日本語意味役割付与システム（ASA）",
                "multilingual_descriptions": {
                    "en": "Python-based Japanese semantic role labeling system (ASA)",
                    "ja": "python版日本語意味役割付与システム（ASA）",
                    "zh-hans": "Python版日本语意义角色标注系统（ASA）",
                    "zh-hant": "Python版日本語意味角色賦予系統（ASA）"
                }
            },
            "https://github.com/taishi-i/toiro": {
                "sub_category": null,
                "repository_name": "toiro",
                "user_name": "taishi-i",
                "description": "A comparison tool of Japanese tokenizers",
                "multilingual_descriptions": {
                    "en": "A comparison tool of Japanese tokenizers",
                    "ja": "日本語トークナイザーの比較ツール",
                    "zh-hans": "日本分词工具比较工具",
                    "zh-hant": "日本語分詞器比較工具"
                }
            },
            "https://github.com/yagays/ja-timex": {
                "sub_category": null,
                "repository_name": "ja-timex",
                "user_name": "yagays",
                "description": "自然言語で書かれた時間情報表現を抽出/規格化するルールベースの解析器",
                "multilingual_descriptions": {
                    "en": "A rule-based parser for extracting/normalizing time expressions written in natural language.",
                    "ja": "自然言語で書かれた時間情報表現を抽出/規格化するルールベースの解析器",
                    "zh-hans": "基于规则的解析器，用于提取/规范自然语言中的时间信息表达。",
                    "zh-hant": "基於規則的解析器，用於提取/規範自然語言中的時間信息表達。"
                }
            },
            "https://github.com/Kensuke-Mitsuzawa/JapaneseTokenizers": {
                "sub_category": null,
                "repository_name": "JapaneseTokenizers",
                "user_name": "Kensuke-Mitsuzawa",
                "description": "A set of metrics for feature selection from text data",
                "multilingual_descriptions": {
                    "en": "A set of metrics for feature selection from text data",
                    "ja": "テキストデータからの特徴選択のためのメトリックのセット",
                    "zh-hans": "从文本数据中选择特征的一组度量标准",
                    "zh-hant": "從文本數據中選擇特徵的一組度量標準"
                }
            },
            "https://github.com/kajyuuen/daaja": {
                "sub_category": null,
                "repository_name": "daaja",
                "user_name": "kajyuuen",
                "description": "This repository has implementations of data augmentation for NLP for Japanese.",
                "multilingual_descriptions": {
                    "en": "This repository has implementations of data augmentation for NLP for Japanese.",
                    "ja": "このリポジトリには、日本語のNLPのためのデータ拡張の実装が含まれています。",
                    "zh-hans": "这个仓库包含了针对日语自然语言处理的数据增强实现。",
                    "zh-hant": "這個存儲庫包含了針對日語自然語言處理的數據增強實現。"
                }
            },
            "https://github.com/accel-brain/accel-brain-code": {
                "sub_category": null,
                "repository_name": "accel-brain-code",
                "user_name": "accel-brain",
                "description": "The purpose of this repository is to make prototypes as case study in the context of proof of concept(PoC) and research and development(R&D) that I have written in my website. The main research topics are Auto-Encoders in relation to the representation learning, the statistical machine learning for energy-based models, adversarial generation net…",
                "multilingual_descriptions": {
                    "en": "The purpose of this repository is to make prototypes as case study in the context of proof of concept(PoC) and research and development(R&D) that I have written in my website. The main research topics are Auto-Encoders in relation to the representation learning, the statistical machine learning for energy-based models, adversarial generation net…",
                    "ja": "このリポジトリの目的は、私がウェブサイトで書いた概念実証（PoC）および研究開発（R＆D）の文脈でプロトタイプをケーススタディとして作成することです。主な研究トピックは、表現学習に関連するオートエンコーダー、エネルギーベースモデルの統計的機械学習、敵対的生成ネットワークなどです...",
                    "zh-hans": "这个仓库的目的是在概念验证（PoC）和研究开发（R＆D）的背景下制作原型作为案例研究，这些案例研究我已经在我的网站上写过。主要研究主题是与表示学习相关的自动编码器，基于能量模型的统计机器学习，对抗生成网络等。",
                    "zh-hant": "這個存儲庫的目的是在概念證明（PoC）和研究開發（R＆D）的背景下製作原型作為案例研究，這些案例研究已經在我的網站上寫出來。主要研究主題是與表示學習相關的自動編碼器，基於能量模型的統計機器學習，對抗生成網絡..."
                }
            },
            "https://github.com/ku-nlp/kyoto-reader": {
                "sub_category": null,
                "repository_name": "kyoto-reader",
                "user_name": "ku-nlp",
                "description": "A processor for KyotoCorpus, KWDLC, and AnnotatedFKCCorpus",
                "multilingual_descriptions": {
                    "en": "A processor for KyotoCorpus, KWDLC, and AnnotatedFKCCorpus",
                    "ja": "京都コーパス、KWDLC、および注釈付きFKCコーパス用のプロセッサー",
                    "zh-hans": "一个用于KyotoCorpus、KWDLC和AnnotatedFKCCorpus的处理器。",
                    "zh-hant": "一個用於KyotoCorpus、KWDLC和AnnotatedFKCCorpus的處理器"
                }
            },
            "https://github.com/takapy0210/nlplot": {
                "sub_category": null,
                "repository_name": "nlplot",
                "user_name": "takapy0210",
                "description": "Visualization Module for Natural Language Processing",
                "multilingual_descriptions": {
                    "en": "Visualization Module for Natural Language Processing",
                    "ja": "自然言語処理の可視化モジュール",
                    "zh-hans": "自然语言处理可视化模块",
                    "zh-hant": "自然語言處理的可視化模組"
                }
            },
            "https://github.com/kanjirz50/rake-ja": {
                "sub_category": null,
                "repository_name": "rake-ja",
                "user_name": "kanjirz50",
                "description": "Rapid Automatic Keyword Extraction algorithm for Japanese",
                "multilingual_descriptions": {
                    "en": "Rapid Automatic Keyword Extraction algorithm for Japanese",
                    "ja": "日本語の高速自動キーワード抽出アルゴリズム",
                    "zh-hans": "用于日语的快速自动关键词提取算法",
                    "zh-hant": "日語快速自動關鍵詞提取演算法"
                }
            },
            "https://github.com/izuna385/jel": {
                "sub_category": null,
                "repository_name": "jel",
                "user_name": "izuna385",
                "description": "Japanese Entity Linker.",
                "multilingual_descriptions": {
                    "en": "Japanese Entity Linker.",
                    "ja": "日本語エンティティリンカー。",
                    "zh-hans": "日本实体链接器。",
                    "zh-hant": "日本實體連結器。"
                }
            },
            "https://github.com/sociocom/MedNER-J": {
                "sub_category": null,
                "repository_name": "MedNER-J",
                "user_name": "sociocom",
                "description": "Latest version of MedEX/J (Japanese disease name extractor)",
                "multilingual_descriptions": {
                    "en": "Latest version of MedEX/J (Japanese disease name extractor)",
                    "ja": "最新版のMedEX/J（日本語疾患名抽出ツール）",
                    "zh-hans": "最新版本的MedEX/J（日本疾病名称提取器）",
                    "zh-hant": "最新版本的MedEX/J（日本疾病名稱提取器）"
                }
            },
            "https://github.com/ikegami-yukino/zunda-python": {
                "sub_category": null,
                "repository_name": "zunda-python",
                "user_name": "ikegami-yukino",
                "description": "Zunda: Japanese Enhanced Modality Analyzer client for Python.",
                "multilingual_descriptions": {
                    "en": "Zunda: Japanese Enhanced Modality Analyzer client for Python.",
                    "ja": "Python用の日本語強調モダリティ解析クライアント「Zunda」。",
                    "zh-hans": "Zunda：Python的日语增强模态分析器客户端。",
                    "zh-hant": "Zunda：Python 的日本增強型情態分析器客戶端。"
                }
            },
            "https://github.com/cl-tohoku/AIO2_DPR_baseline": {
                "sub_category": null,
                "repository_name": "AIO2_DPR_baseline",
                "user_name": "cl-tohoku",
                "description": "https://www.nlp.ecei.tohoku.ac.jp/projects/aio/",
                "multilingual_descriptions": {
                    "en": "https://www.nlp.ecei.tohoku.ac.jp/projects/aio/",
                    "ja": "https://www.nlp.ecei.tohoku.ac.jp/projects/aio/ を入力してください。",
                    "zh-hans": "https://www.nlp.ecei.tohoku.ac.jp/projects/aio/ \n\nhttps://www.nlp.ecei.tohoku.ac.jp/projects/aio/",
                    "zh-hant": "https://www.nlp.ecei.tohoku.ac.jp/projects/aio/ \n\nhttps://www.nlp.ecei.tohoku.ac.jp/projects/aio/"
                }
            },
            "https://github.com/cl-tohoku/showcase": {
                "sub_category": null,
                "repository_name": "showcase",
                "user_name": "cl-tohoku",
                "description": "A PyTorch implementation of the Japanese Predicate-Argument Structure (PAS) analyser presented in the paper of Matsubayashi & Inui (2018) with some improvements.",
                "multilingual_descriptions": {
                    "en": "A PyTorch implementation of the Japanese Predicate-Argument Structure (PAS) analyser presented in the paper of Matsubayashi & Inui (2018) with some improvements.",
                    "ja": "Matsubayashi＆Inui（2018）の論文で紹介された日本語述語引数構造（PAS）解析器のPyTorch実装にいくつかの改良を加えました。",
                    "zh-hans": "一个PyTorch实现的日语谓词-论元结构（PAS）分析器，基于Matsubayashi＆Inui（2018）的论文，并进行了一些改进。",
                    "zh-hant": "一個PyTorch實現的日本述語-參數結構（PAS）分析器，該分析器在Matsubayashi＆Inui（2018）的論文中提出，並進行了一些改進。"
                }
            },
            "https://github.com/rixwew/darts-clone-python": {
                "sub_category": null,
                "repository_name": "darts-clone-python",
                "user_name": "rixwew",
                "description": "Darts-clone python binding",
                "multilingual_descriptions": {
                    "en": "Darts-clone python binding",
                    "ja": "ダーツクローンのPythonバインディング",
                    "zh-hans": "飞镖克隆 Python 绑定",
                    "zh-hant": "飛鏢克隆 Python 綁定"
                }
            },
            "https://github.com/megagonlabs/jrte-corpus_example": {
                "sub_category": null,
                "repository_name": "jrte-corpus_example",
                "user_name": "megagonlabs",
                "description": "Example codes for Japanese Realistic Textual Entailment Corpus",
                "multilingual_descriptions": {
                    "en": "Example codes for the Japanese Realistic Textual Entailment Corpus.",
                    "ja": "日本の現実的なテキスト推論コーパスの例コード",
                    "zh-hans": "日本现实文本蕴含语料库的示例代码",
                    "zh-hant": "日本寫實文本蘊含語料庫的範例代碼"
                }
            },
            "https://github.com/megagonlabs/desuwa": {
                "sub_category": null,
                "repository_name": "desuwa",
                "user_name": "megagonlabs",
                "description": "Feature annotator to morphemes and phrases based on KNP rule files (pure-Python)",
                "multilingual_descriptions": {
                    "en": "Feature annotator to morphemes and phrases based on KNP rule files (pure-Python)",
                    "ja": "KNPルールファイルに基づく形態素とフレーズの特徴注釈ツール（純粋なPython）",
                    "zh-hans": "基于KNP规则文件的特征注释器，可将单词和短语转换为形态素（纯Python实现）。",
                    "zh-hant": "基於KNP規則文件的特徵標註器，可將單詞和詞組轉換為形態素（純Python）"
                }
            },
            "https://github.com/Hironsan/HotPepperGourmetDialogue": {
                "sub_category": null,
                "repository_name": "HotPepperGourmetDialogue",
                "user_name": "Hironsan",
                "description": "Restaurant Search System through Dialogue in Japanese.",
                "multilingual_descriptions": {
                    "en": "Restaurant Search System through Dialogue in Japanese.",
                    "ja": "日本語による対話を通じたレストラン検索システム。",
                    "zh-hans": "通过日语对话的餐厅搜索系统。",
                    "zh-hant": "通過日語對話的餐廳搜索系統。"
                }
            },
            "https://github.com/upura/nlp-recipes-ja": {
                "sub_category": null,
                "repository_name": "nlp-recipes-ja",
                "user_name": "upura",
                "description": "Samples codes for natural language processing in Japanese",
                "multilingual_descriptions": {
                    "en": "Samples codes for natural language processing in Japanese",
                    "ja": "日本語の自然言語処理のサンプルコード",
                    "zh-hans": "日语自然语言处理的样本代码",
                    "zh-hant": "日語自然語言處理的樣本程式碼"
                }
            },
            "https://github.com/olsgaard/Japanese_nlp_scripts": {
                "sub_category": null,
                "repository_name": "Japanese_nlp_scripts",
                "user_name": "olsgaard",
                "description": "Small example scripts for working with Japanese texts in Python",
                "multilingual_descriptions": {
                    "en": "Small example scripts for working with Japanese texts in Python",
                    "ja": "Pythonで日本語テキストを扱うための小さなサンプルスクリプト",
                    "zh-hans": "Python处理日语文本的小例子脚本",
                    "zh-hant": "在Python中處理日文文本的小例子腳本"
                }
            },
            "https://github.com/sociocom/DNorm-J": {
                "sub_category": null,
                "repository_name": "DNorm-J",
                "user_name": "sociocom",
                "description": "Japanese version of DNorm",
                "multilingual_descriptions": {
                    "en": "Japanese version of DNorm",
                    "ja": "DNormの日本語版",
                    "zh-hans": "DNorm的日语版本",
                    "zh-hant": "DNorm的日文版本"
                }
            },
            "https://github.com/ku-nlp/pyknp-eventgraph": {
                "sub_category": null,
                "repository_name": "pyknp-eventgraph",
                "user_name": "ku-nlp",
                "description": "EventGraph is a development platform for high-level NLP applications in Japanese.",
                "multilingual_descriptions": {
                    "en": "EventGraph is a development platform for high-level NLP applications in Japanese.",
                    "ja": "EventGraphは、日本語の高度なNLPアプリケーションの開発プラットフォームです。",
                    "zh-hans": "EventGraph是一个用于日语高级自然语言处理应用程序开发的平台。",
                    "zh-hant": "EventGraph是一個針對高階日語自然語言處理應用的開發平台。"
                }
            },
            "https://github.com/ku-nlp/ishi": {
                "sub_category": null,
                "repository_name": "ishi",
                "user_name": "ku-nlp",
                "description": "Ishi: A volition classifier for Japanese",
                "multilingual_descriptions": {
                    "en": "Ishi: A volition classifier for Japanese",
                    "ja": "石：日本語の意志分類器",
                    "zh-hans": "石：日语意愿分类器",
                    "zh-hant": "石：日語意志分類器"
                }
            },
            "https://github.com/musyoku/python-npylm": {
                "sub_category": null,
                "repository_name": "python-npylm",
                "user_name": "musyoku",
                "description": "ベイズ階層言語モデルによる教師なし形態素解析",
                "multilingual_descriptions": {
                    "en": "Unsupervised morphological analysis using a Bayesian hierarchical language model.",
                    "ja": "ベイズ階層言語モデルによる教師なし形態素解析",
                    "zh-hans": "基于贝叶斯层次语言模型的无监督形态素分析。",
                    "zh-hant": "利用貝葉斯階層語言模型進行無監督詞素分析"
                }
            },
            "https://github.com/musyoku/python-npycrf": {
                "sub_category": null,
                "repository_name": "python-npycrf",
                "user_name": "musyoku",
                "description": "条件付確率場とベイズ階層言語モデルの統合による半教師あり形態素解析",
                "multilingual_descriptions": {
                    "en": "Semi-supervised morphological analysis through integration of conditional probability fields and Bayesian hierarchical language models.",
                    "ja": "条件付確率場とベイズ階層言語モデルの統合による半教師あり形態素解析",
                    "zh-hans": "通过条件付概率场和贝叶斯层次语言模型的整合实现半监督形态分析。",
                    "zh-hant": "條件付機率場和貝葉斯階層語言模型的整合，實現半監督形態素分析。"
                }
            },
            "https://github.com/musyoku/unsupervised-pos-tagging": {
                "sub_category": null,
                "repository_name": "unsupervised-pos-tagging",
                "user_name": "musyoku",
                "description": "教師なし品詞タグ推定",
                "multilingual_descriptions": {
                    "en": "Part-of-speech tagging without a teacher",
                    "ja": "教師なし品詞タグ推定",
                    "zh-hans": "无教师词性标注推测",
                    "zh-hant": "教師無品詞標記推斷"
                }
            },
            "https://github.com/cocodrips/negima": {
                "sub_category": null,
                "repository_name": "negima",
                "user_name": "cocodrips",
                "description": "Negima is a Python package to extract phrases in Japanese text by using the part-of-speeches based rules you defined.",
                "multilingual_descriptions": {
                    "en": "Negima is a Python package to extract phrases in Japanese text by using the part-of-speeches based rules you defined.",
                    "ja": "Negimaは、定義した品詞ベースのルールを使用して、日本語テキストからフレーズを抽出するためのPythonパッケージです。",
                    "zh-hans": "Negima是一个Python包，可以通过使用您定义的基于词性的规则来提取日语文本中的短语。",
                    "zh-hant": "Negima是一個Python套件，可以通過使用您定義的基於詞性的規則來提取日文文本中的短語。"
                }
            },
            "https://github.com/neilctwu/YouyakuMan": {
                "sub_category": null,
                "repository_name": "YouyakuMan",
                "user_name": "neilctwu",
                "description": "Extractive summarizer using BertSum as summarization model",
                "multilingual_descriptions": {
                    "en": "Extractive summarizer using BertSum as summarization model",
                    "ja": "BertSumを要約モデルとして使用する抽出型要約器",
                    "zh-hans": "使用BertSum作为摘要模型的提取式摘要器",
                    "zh-hant": "使用BertSum作為摘要模型的提取式摘要器"
                }
            },
            "https://github.com/takumakanari/japanese-numbers-python": {
                "sub_category": null,
                "repository_name": "japanese-numbers-python",
                "user_name": "takumakanari",
                "description": "A parser for Japanese number (Kanji, arabic) in the natural language.",
                "multilingual_descriptions": {
                    "en": "A parser for Japanese number (Kanji, arabic) in the natural language.",
                    "ja": "自然言語での日本語数字（漢字、アラビア数字）のパーサー。",
                    "zh-hans": "一个自然语言中的日语数字（汉字、阿拉伯数字）解析器。",
                    "zh-hant": "一個自然語言中的日本數字（漢字、阿拉伯數字）解析器。"
                }
            },
            "https://github.com/itayperl/kantan": {
                "sub_category": null,
                "repository_name": "kantan",
                "user_name": "itayperl",
                "description": "Lookup japanese words by radical patterns",
                "multilingual_descriptions": {
                    "en": "Lookup japanese words by radical patterns",
                    "ja": "部首のパターンで日本語の単語を検索する",
                    "zh-hans": "按部首查找日语单词",
                    "zh-hant": "按部首模式查找日語單詞"
                }
            },
            "https://github.com/knok/make-meidai-dialogue": {
                "sub_category": null,
                "repository_name": "make-meidai-dialogue",
                "user_name": "knok",
                "description": "Get Japanese dialogue corpus",
                "multilingual_descriptions": {
                    "en": "Obtain a corpus of Japanese dialogue.",
                    "ja": "日本語の会話コーパスを取得する。",
                    "zh-hans": "获取日语对话语料库",
                    "zh-hant": "獲取日語對話語料庫"
                }
            },
            "https://github.com/ryuryukke/japanese_summarizer": {
                "sub_category": null,
                "repository_name": "japanese_summarizer",
                "user_name": "ryuryukke",
                "description": "A summarizer for Japanese articles.",
                "multilingual_descriptions": {
                    "en": "A summarizer for Japanese articles.",
                    "ja": "日本語記事の要約ツール。",
                    "zh-hans": "日本文章摘要器。",
                    "zh-hant": "日本文章摘要器。"
                }
            },
            "https://github.com/letuananh/chirptext": {
                "sub_category": null,
                "repository_name": "chirptext",
                "user_name": "letuananh",
                "description": "ChirpText is a collection of text processing tools for Python.",
                "multilingual_descriptions": {
                    "en": "ChirpText is a collection of text processing tools for Python.",
                    "ja": "ChirpTextはPythonのテキスト処理ツールのコレクションです。",
                    "zh-hans": "ChirpText是Python的文本处理工具集合。",
                    "zh-hant": "ChirpText 是一個針對 Python 的文本處理工具集合。"
                }
            },
            "https://github.com/alvations/yubin": {
                "sub_category": null,
                "repository_name": "yubin",
                "user_name": "alvations",
                "description": "Japanese Address Munger",
                "multilingual_descriptions": {
                    "en": "日本の住所マンガー",
                    "ja": "日本の住所マンガー",
                    "zh-hans": "日本地址Munger",
                    "zh-hant": "日本地址 Munger"
                }
            },
            "https://github.com/hppRC/jawiki-cleaner": {
                "sub_category": null,
                "repository_name": "jawiki-cleaner",
                "user_name": "hppRC",
                "description": "Japanese Wikipedia Cleaner",
                "multilingual_descriptions": {
                    "en": "Japanese Wikipedia Cleaner",
                    "ja": "日本語ウィキペディアクリーナー",
                    "zh-hans": "日语维基百科清理工具",
                    "zh-hant": "日本維基百科清潔工具"
                }
            },
            "https://github.com/iory/japanese2phoneme": {
                "sub_category": null,
                "repository_name": "japanese2phoneme",
                "user_name": "iory",
                "description": "A python library to convert Japanese to phoneme.",
                "multilingual_descriptions": {
                    "en": "A python library to convert Japanese to phoneme.",
                    "ja": "日本語を音素に変換するためのPythonライブラリ。",
                    "zh-hans": "一个将日语转换为音素的Python库。",
                    "zh-hant": "一個將日文轉換為音素的Python庫。"
                }
            },
            "https://github.com/arusl/anlp_nlp2021_d3-1": {
                "sub_category": null,
                "repository_name": "anlp_nlp2021_d3-1",
                "user_name": "arusl",
                "description": "This repository contains codes related to the experiments in \"An Experimental Evaluation of Japanese Tokenizers for Sentiment-Based Text Classification\"",
                "multilingual_descriptions": {
                    "en": "This repository contains codes related to the experiments in \"An Experimental Evaluation of Japanese Tokenizers for Sentiment-Based Text Classification\"",
                    "ja": "このリポジトリには、「感情に基づくテキスト分類のための日本語トークナイザーの実験的評価」に関連するコードが含まれています。",
                    "zh-hans": "这个代码库包含与“基于情感的文本分类的日语分词器的实验评估”相关的代码。",
                    "zh-hant": "這個存儲庫包含與“基於情感的文本分類的日語分詞器的實驗評估”相關的代碼。"
                }
            },
            "https://github.com/shibuiwilliam/aozora_classification": {
                "sub_category": null,
                "repository_name": "aozora_classification",
                "user_name": "shibuiwilliam",
                "description": "About",
                "multilingual_descriptions": {
                    "en": "About",
                    "ja": "約について",
                    "zh-hans": "关于",
                    "zh-hant": "關於"
                }
            },
            "https://github.com/borh/aozora-corpus-generator": {
                "sub_category": null,
                "repository_name": "aozora-corpus-generator",
                "user_name": "borh",
                "description": "Generates plain or tokenized text files from the Aozora Bunko",
                "multilingual_descriptions": {
                    "en": "Generates plain or tokenized text files from the Aozora Bunko",
                    "ja": "青空文庫からプレーンテキストまたはトークン化されたテキストファイルを生成します。",
                    "zh-hans": "从青空文库生成纯文本或标记化文本文件。",
                    "zh-hant": "從青空文庫生成純文本或標記化文本文件"
                }
            },
            "https://github.com/jiali-ms/JLM": {
                "sub_category": null,
                "repository_name": "JLM",
                "user_name": "jiali-ms",
                "description": "A fast LSTM Language Model for large vocabulary language like Japanese and Chinese",
                "multilingual_descriptions": {
                    "en": "A fast LSTM Language Model for large vocabulary language like Japanese and Chinese",
                    "ja": "日本語や中国語のような大語彙言語に対応した高速なLSTM言語モデル",
                    "zh-hans": "一个快速的LSTM语言模型，适用于日语和中文等大词汇语言。",
                    "zh-hant": "一個快速的LSTM語言模型，適用於日語和中文等大詞彙語言。"
                }
            },
            "https://github.com/m3yrin/NTM": {
                "sub_category": null,
                "repository_name": "NTM",
                "user_name": "m3yrin",
                "description": "Testing of Neural Topic Modeling for Japanese articles",
                "multilingual_descriptions": {
                    "en": "Testing of Neural Topic Modeling for Japanese articles",
                    "ja": "日本語記事のニューラルトピックモデリングのテスト",
                    "zh-hans": "日本文章的神经主题建模测试",
                    "zh-hant": "日本文章的神經主題建模測試"
                }
            },
            "https://github.com/Machine-Learning-Tokyo/EN-JP-ML-Lexicon": {
                "sub_category": null,
                "repository_name": "EN-JP-ML-Lexicon",
                "user_name": "Machine-Learning-Tokyo",
                "description": "This is a English-Japanese lexicon for Machine Learning and Deep Learning terminology.",
                "multilingual_descriptions": {
                    "en": "This is a English-Japanese lexicon for Machine Learning and Deep Learning terminology.",
                    "ja": "これは、機械学習とディープラーニングの用語に関する英日語辞典です。",
                    "zh-hans": "这是一个英日机器学习和深度学习术语词典。",
                    "zh-hant": "這是一個機器學習和深度學習術語的英日詞彙表。"
                }
            },
            "https://github.com/discus0434/text-generation": {
                "sub_category": null,
                "repository_name": "text-generation",
                "user_name": "discus0434",
                "description": "Easy-to-use scripts to fine-tune GPT-2-JA with your own texts, to generate sentences, and to tweet them automatically.",
                "multilingual_descriptions": {
                    "en": "Easy-to-use scripts to fine-tune GPT-2-JA with your own texts, to generate sentences, and to tweet them automatically.",
                    "ja": "あなた自身のテキストでGPT-2-JAを微調整し、文章を生成し、自動的にツイートするための使いやすいスクリプト。",
                    "zh-hans": "易于使用的脚本，可通过您自己的文本对GPT-2-JA进行微调，生成句子并自动发布推文。",
                    "zh-hant": "易於使用的腳本，可調整GPT-2-JA與您自己的文本，生成句子並自動發推文。"
                }
            },
            "https://github.com/yuyay/chainer_nic": {
                "sub_category": null,
                "repository_name": "chainer_nic",
                "user_name": "yuyay",
                "description": "Neural Image Caption (NIC) on chainer, its pretrained models on English and Japanese image caption datasets.",
                "multilingual_descriptions": {
                    "en": "Neural Image Caption (NIC) on chainer, its pretrained models on English and Japanese image caption datasets.",
                    "ja": "Chainer上のニューラル画像キャプション（NIC）、英語と日本語の画像キャプションデータセットの事前学習済みモデル。",
                    "zh-hans": "神经图像描述（NIC）在Chainer上的预训练模型，其英语和日语图像描述数据集的预训练模型。",
                    "zh-hant": "在Chainer上的神經圖像標題（NIC），其預訓練模型適用於英語和日語圖像標題數據集。"
                }
            },
            "https://github.com/JetRunner/unihan-lm": {
                "sub_category": null,
                "repository_name": "unihan-lm",
                "user_name": "JetRunner",
                "description": "The official repository for \"UnihanLM: Coarse-to-Fine Chinese-Japanese Language Model Pretraining with the Unihan Database\", AACL-IJCNLP 2020",
                "multilingual_descriptions": {
                    "en": "The official repository for \"UnihanLM: Coarse-to-Fine Chinese-Japanese Language Model Pretraining with the Unihan Database\", AACL-IJCNLP 2020",
                    "ja": "「UnihanLM：Unihanデータベースを用いた粗-細分割の中国語-日本語言語モデル事前学習」の公式リポジトリ、AACL-IJCNLP 2020",
                    "zh-hans": "“UnihanLM: 基于Unihan数据库的中日语言模型预训练的官方代码库”，AACL-IJCNLP 2020",
                    "zh-hant": "「UnihanLM：使用Unihan數據庫進行粗到細的中日語言模型預訓練」的官方存儲庫，AACL-IJCNLP 2020"
                }
            },
            "https://github.com/ken11/mbart-finetuning": {
                "sub_category": null,
                "repository_name": "mbart-finetuning",
                "user_name": "ken11",
                "description": "Code to perform finetuning of the mBART model.",
                "multilingual_descriptions": {
                    "en": "Code to perform finetuning of the mBART model.",
                    "ja": "mBARTモデルのファインチューニングを実行するためのコード。",
                    "zh-hans": "用于微调mBART模型的代码。",
                    "zh-hant": "執行 mBART 模型微調的程式碼。"
                }
            },
            "https://github.com/sarulab-speech/xvector_jtubespeech": {
                "sub_category": null,
                "repository_name": "xvector_jtubespeech",
                "user_name": "sarulab-speech",
                "description": "xvector model on jtubespeech",
                "multilingual_descriptions": {
                    "en": "Model xvector on jtubespeech.",
                    "ja": "jtubespeech上のxvectorモデル",
                    "zh-hans": "在jtubespeech上的xvector模型",
                    "zh-hant": "在jtubespeech上的xvector模型"
                }
            },
            "https://github.com/shogo82148/TinySegmenterMaker": {
                "sub_category": null,
                "repository_name": "TinySegmenterMaker",
                "user_name": "shogo82148",
                "description": "TinySegmenter用の学習モデルを自作するためのツール．",
                "multilingual_descriptions": {
                    "en": "A tool for creating a custom learning model for TinySegmenter.",
                    "ja": "TinySegmenter用の学習モデルを自作するためのツール．",
                    "zh-hans": "用于创建TinySegmenter学习模型的工具。",
                    "zh-hant": "自製TinySegmenter學習模型的工具。"
                }
            },
            "https://github.com/shogo82148/Grongish": {
                "sub_category": null,
                "repository_name": "Grongish",
                "user_name": "shogo82148",
                "description": "日本語とグロンギ語の相互変換スクリプト",
                "multilingual_descriptions": {
                    "en": "Script for mutual conversion between Japanese and Gurongi language.",
                    "ja": "日本語とグロンギ語の相互変換スクリプト",
                    "zh-hans": "日语和格龙基语的相互转换脚本",
                    "zh-hant": "日本語和格隆基語的相互轉換腳本"
                }
            },
            "https://github.com/aocattleya/WordCloud-Japanese": {
                "sub_category": null,
                "repository_name": "WordCloud-Japanese",
                "user_name": "aocattleya",
                "description": "WordCloudでの日本語文章をMecab（形態素解析エンジン）を使用せずに形態素解析チックな表示を実現するスクリプト",
                "multilingual_descriptions": {
                    "en": "A script that enables morphological analysis-like display of Japanese sentences in WordCloud without using Mecab (a morphological analysis engine).",
                    "ja": "WordCloudでの日本語文章をMecab（形態素解析エンジン）を使用せずに形態素解析チックな表示を実現するスクリプト",
                    "zh-hans": "使用WordCloud生成的日语文章，无需使用Mecab（形态素解析引擎），即可实现形态素解析式的显示脚本。",
                    "zh-hant": "使用WordCloud製作日文文章的腳本，實現形態素解析式的顯示，不需使用Mecab（形態素解析引擎）。"
                }
            },
            "https://github.com/hiraokusky/snark": {
                "sub_category": null,
                "repository_name": "snark",
                "user_name": "hiraokusky",
                "description": "日本語ワードネットを利用したDBアクセスライブラリ",
                "multilingual_descriptions": {
                    "en": "DB access library using Japanese WordNet",
                    "ja": "日本語ワードネットを利用したDBアクセスライブラリ",
                    "zh-hans": "使用日语WordNet的DB访问库",
                    "zh-hant": "利用日本語詞彙網路的資料庫存取程式庫"
                }
            },
            "https://github.com/mkan0141/toEmoji": {
                "sub_category": null,
                "repository_name": "toEmoji",
                "user_name": "mkan0141",
                "description": "日本語文を絵文字だけの文に変換するなにか",
                "multilingual_descriptions": {
                    "en": "Something that converts Japanese sentences into sentences made up of only emojis.",
                    "ja": "日本語文を絵文字だけの文に変換するなにか",
                    "zh-hans": "将日语文本转换为仅包含表情符号的文本的工具",
                    "zh-hant": "將日文轉換為僅由表情符號組成的文本的工具"
                }
            },
            "https://github.com/kanjirz50/termextract": {
                "sub_category": null,
                "repository_name": "termextract",
                "user_name": "kanjirz50",
                "description": "専門用語抽出アルゴリズムの実装の練習",
                "multilingual_descriptions": {
                    "en": "Practice implementing a specialized terminology extraction algorithm.",
                    "ja": "- 専門用語抽出アルゴリズムの実装の練習",
                    "zh-hans": "- 专业术语抽取算法的实现练习",
                    "zh-hant": "- 專門用語抽出演算法的實現練習"
                }
            },
            "https://github.com/TUT-SLP-lab/JDT-with-KenLM-scoring": {
                "sub_category": null,
                "repository_name": "JDT-with-KenLM-scoring",
                "user_name": "TUT-SLP-lab",
                "description": "Japanese-Dialog-Transformerの応答候補に対して、KenLMによるN-gram言語モデルでスコアリングし、フィルタリング若しくはリランキングを行う。",
                "multilingual_descriptions": {
                    "en": "Scoring is performed using an N-gram language model by KenLM on response candidates from Japanese-Dialog-Transformer, followed by filtering or re-ranking.",
                    "ja": "Japanese-Dialog-Transformerの応答候補に対して、KenLMによるN-gram言語モデルでスコアリングし、フィルタリング若しくはリランキングを行う。",
                    "zh-hans": "对于Japanese-Dialog-Transformer的响应候选，使用KenLM的N-gram语言模型进行评分，进行过滤或重新排序。",
                    "zh-hant": "對於Japanese-Dialog-Transformer的回應候選，使用KenLM的N-gram語言模型進行評分，進行過濾或重新排序。"
                }
            },
            "https://github.com/KentoW/mixture-of-unigram-model": {
                "sub_category": null,
                "repository_name": "mixture-of-unigram-model",
                "user_name": "KentoW",
                "description": "Mixture of Unigram Model and Infinite Mixture of Unigram Model in Python. (混合ユニグラムモデルと無限混合ユニグラムモデル)",
                "multilingual_descriptions": {
                    "en": "Mixture of Unigram Model and Infinite Mixture of Unigram Model in Python. (混合ユニグラムモデルと無限混合ユニグラムモデル)",
                    "ja": "Pythonにおける混合ユニグラムモデルと無限混合ユニグラムモデルの組み合わせ。",
                    "zh-hans": "Python中的混合Unigram模型和无限混合Unigram模型。",
                    "zh-hant": "Python中的混合Unigram模型和无限混合Unigram模型。 (混合單詞模型和無限混合單詞模型在Python中。)"
                }
            },
            "https://github.com/KentoW/hidden-markov-model": {
                "sub_category": null,
                "repository_name": "hidden-markov-model",
                "user_name": "KentoW",
                "description": "Hidden Markov Model (HMM) and Infinite Hidden Markov Model (iHMM) in Python. (隠れマルコフモデルと無限隠れマルコフモデル)",
                "multilingual_descriptions": {
                    "en": "隠れマルコフモデル (Hidden Markov Model, HMM) and 無限隠れマルコフモデル (Infinite Hidden Markov Model, iHMM) in Python.",
                    "ja": "Pythonにおける隠れマルコフモデル（HMM）と無限隠れマルコフモデル（iHMM）。",
                    "zh-hans": "Python中的隐马尔可夫模型（HMM）和无限隐马尔可夫模型（iHMM）。",
                    "zh-hant": "Python中的隱藏馬可夫模型（HMM）和無限隱藏馬可夫模型（iHMM）。"
                }
            },
            "https://github.com/KentoW/Ngram-language-model": {
                "sub_category": null,
                "repository_name": "Ngram-language-model",
                "user_name": "KentoW",
                "description": "Ngram language model in Python. (Nグラム言語モデル)",
                "multilingual_descriptions": {
                    "en": "Ngram language model in Python. (Nグラム言語モデル)",
                    "ja": "PythonにおけるNグラム言語モデル。",
                    "zh-hans": "Python中的Ngram语言模型。",
                    "zh-hant": "Python中的Ngram語言模型。 (N-gram語言模型)"
                }
            },
            "https://github.com/JeanMaximilienCadic/ASRDeepSpeech": {
                "sub_category": null,
                "repository_name": "ASRDeepSpeech",
                "user_name": "JeanMaximilienCadic",
                "description": "Automatic Speech Recognition with deepspeech2 model in pytorch with support from Zakuro AI.",
                "multilingual_descriptions": {
                    "en": "Automatic Speech Recognition with deepspeech2 model in pytorch with support from Zakuro AI.",
                    "ja": "自動音声認識は、Zakuro AIのサポートを受けたpytorchのdeepspeech2モデルを使用しています。",
                    "zh-hans": "使用PyTorch中的deepspeech2模型和Zakuro AI的支持进行自动语音识别。",
                    "zh-hant": "使用PyTorch中的deepspeech2模型和Zakuro AI的支援進行自動語音識別。"
                }
            },
            "https://github.com/yohokuno/neural_ime": {
                "sub_category": null,
                "repository_name": "neural_ime",
                "user_name": "yohokuno",
                "description": "Neural IME: Neural Input Method Engine",
                "multilingual_descriptions": {
                    "en": "Neural IME: Neural Input Method Engine",
                    "ja": "ニューラルIME：ニューラル入力方式エンジン",
                    "zh-hans": "神经输入法引擎：神经输入法引擎",
                    "zh-hant": "神經輸入法引擎：神經輸入法引擎"
                }
            },
            "https://github.com/Kyubyong/neural_japanese_transliterator": {
                "sub_category": null,
                "repository_name": "neural_japanese_transliterator",
                "user_name": "Kyubyong",
                "description": "Can neural networks transliterate Romaji into Japanese correctly?",
                "multilingual_descriptions": {
                    "en": "Can neural networks transliterate Romaji into Japanese correctly?",
                    "ja": "ニューラルネットワークはローマ字を正しく日本語に転写できますか？",
                    "zh-hans": "神经网络能正确地将罗马字转写成日语吗？",
                    "zh-hant": "神經網路能正確地將羅馬字轉寫成日文嗎？"
                }
            },
            "https://github.com/SamuraiT/tinysegmenter": {
                "sub_category": null,
                "repository_name": "tinysegmenter",
                "user_name": "SamuraiT",
                "description": "tokenizer specified for Japanese",
                "multilingual_descriptions": {
                    "en": "tokenizer specified for Japanese",
                    "ja": "日本語用のトークナイザーが指定されました。",
                    "zh-hans": "为日语指定的分词器",
                    "zh-hant": "針對日語指定的分詞器"
                }
            },
            "https://github.com/chck/AugLy-jp": {
                "sub_category": null,
                "repository_name": "AugLy-jp",
                "user_name": "chck",
                "description": "Data Augmentation for Japanese Text on AugLy",
                "multilingual_descriptions": {
                    "en": "Data Augmentation for Japanese Text on AugLy",
                    "ja": "AugLyにおける日本語テキストのデータ拡張",
                    "zh-hans": "AugLy上的日语文本数据增强",
                    "zh-hant": "在AugLy上進行日文文本的數據增強"
                }
            },
            "https://github.com/Mumumu4/furigana4epub": {
                "sub_category": null,
                "repository_name": "furigana4epub",
                "user_name": "Mumumu4",
                "description": "A Python script for adding furigana to Japanese epub books using Mecab and Unidic.",
                "multilingual_descriptions": {
                    "en": "A Python script for adding furigana to Japanese epub books using Mecab and Unidic.",
                    "ja": "MecabとUnidicを使用して日本語のepub書籍にフリガナを追加するためのPythonスクリプト。",
                    "zh-hans": "一个使用Mecab和Unidic为日语epub书籍添加振仮名的Python脚本。",
                    "zh-hant": "一個使用Mecab和Unidic將振仮名添加到日語epub書籍的Python腳本。"
                }
            },
            "https://github.com/SmashinFries/PyKatsuyou": {
                "sub_category": null,
                "repository_name": "PyKatsuyou",
                "user_name": "SmashinFries",
                "description": "Japanese verb/adjective inflections tool",
                "multilingual_descriptions": {
                    "en": "Japanese verb/adjective inflections tool",
                    "ja": "日本語の動詞/形容詞の活用ツール",
                    "zh-hans": "日语动词/形容词变形工具",
                    "zh-hant": "日語動詞/形容詞變化工具"
                }
            },
            "https://github.com/t-sagara/jageocoder": {
                "sub_category": null,
                "repository_name": "jageocoder",
                "user_name": "t-sagara",
                "description": "Pure Python Japanese address geocoder",
                "multilingual_descriptions": {
                    "en": "Pure Python Japanese address geocoder",
                    "ja": "純粋なPythonの日本の住所ジオコーダー",
                    "zh-hans": "纯Python日本地址地理编码器",
                    "zh-hant": "純Python日本地址地理編碼器"
                }
            },
            "https://github.com/yoriyuki/nksnd": {
                "sub_category": null,
                "repository_name": "nksnd",
                "user_name": "yoriyuki",
                "description": "New kana-kanji conversion engine",
                "multilingual_descriptions": {
                    "en": "新しい仮名漢字変換エンジン",
                    "ja": "新しいかな漢字変換エンジン",
                    "zh-hans": "新的假名汉字转换引擎",
                    "zh-hant": "新的假名漢字轉換引擎"
                }
            },
            "https://github.com/racerandom/JaMIE": {
                "sub_category": null,
                "repository_name": "JaMIE",
                "user_name": "racerandom",
                "description": "A Japanese Medical Information Extraction Toolkit",
                "multilingual_descriptions": {
                    "en": "A Japanese Medical Information Extraction Toolkit",
                    "ja": "日本語医療情報抽出ツールキット",
                    "zh-hans": "一个日本医疗信息提取工具包",
                    "zh-hant": "一個日本醫學信息提取工具箱"
                }
            },
            "https://github.com/GINK03/fasttext-vs-word2vec-on-twitter-data": {
                "sub_category": null,
                "repository_name": "fasttext-vs-word2vec-on-twitter-data",
                "user_name": "GINK03",
                "description": "fasttextとword2vecの比較と、実行スクリプト、学習スクリプトです",
                "multilingual_descriptions": {
                    "en": "This is a comparison between fasttext and word2vec, as well as execution and learning scripts.",
                    "ja": "fasttextとword2vecの比較と、実行スクリプト、学習スクリプトです",
                    "zh-hans": "这是有关fasttext和word2vec的比较，以及执行脚本和学习脚本。",
                    "zh-hant": "這是有關 fasttext 和 word2vec 的比較，以及執行腳本和學習腳本。"
                }
            },
            "https://github.com/GINK03/minimal-search-engine": {
                "sub_category": null,
                "repository_name": "minimal-search-engine",
                "user_name": "GINK03",
                "description": "最小のサーチエンジン/PageRank/tf-idf",
                "multilingual_descriptions": {
                    "en": "Smallest search engine/PageRank/tf-idf",
                    "ja": "最小のサーチエンジン/PageRank/tf-idf",
                    "zh-hans": "最小的搜索引擎/PageRank/tf-idf",
                    "zh-hant": "最小的搜尋引擎/PageRank/tf-idf"
                }
            },
            "https://github.com/GINK03/5ch-analysis": {
                "sub_category": null,
                "repository_name": "5ch-analysis",
                "user_name": "GINK03",
                "description": "5chの過去ログをスクレイピングして、過去流行った単語(ex, 香具師, orz)などを追跡調査",
                "multilingual_descriptions": {
                    "en": "Scraping past logs from 5ch and conducting tracking investigations on words that were popular in the past (e.g. kagutsushi, orz).",
                    "ja": "5chの過去ログをスクレイピングして、過去流行った単語(ex, 香具師, orz)などを追跡調査",
                    "zh-hans": "通过网络爬虫获取5ch的历史记录，跟踪调查过去流行的词语（例如，香具师，orz）等。",
                    "zh-hant": "利用網路爬蟲技術，對5ch的歷史紀錄進行擷取，追蹤調查過去流行的詞語（例如：香具師、orz等）。"
                }
            },
            "https://github.com/tatHi/tweet_extructor": {
                "sub_category": null,
                "repository_name": "tweet_extructor",
                "user_name": "tatHi",
                "description": "Twitter日本語評判分析データセットのためのツイートダウンローダ",
                "multilingual_descriptions": {
                    "en": "Tweet downloader for Japanese sentiment analysis dataset on Twitter.",
                    "ja": "Twitter日本語評判分析データセットのためのツイートダウンローダ",
                    "zh-hans": "用于Twitter日语评价分析数据集的推文下载器",
                    "zh-hant": "Twitter日語評價分析資料集的推文下載器"
                }
            },
            "https://github.com/hkiyomaru/japanese-word-aggregation": {
                "sub_category": null,
                "repository_name": "japanese-word-aggregation",
                "user_name": "hkiyomaru",
                "description": "Aggregating Japanese words based on Juman++ and ConceptNet5.5",
                "multilingual_descriptions": {
                    "en": "Aggregating Japanese words based on Juman++ and ConceptNet5.5",
                    "ja": "Juman++とConceptNet5.5に基づいて日本語の単語を集約する。",
                    "zh-hans": "基于Juman++和ConceptNet5.5聚合日语单词。",
                    "zh-hant": "基於Juman++和ConceptNet5.5的日語詞匯聚合"
                }
            },
            "https://github.com/hkiyomaru/jinf": {
                "sub_category": null,
                "repository_name": "jinf",
                "user_name": "hkiyomaru",
                "description": "A Japanese inflection converter",
                "multilingual_descriptions": {
                    "en": "A Japanese inflection converter",
                    "ja": "日本語活用変換ツール",
                    "zh-hans": "一个日语变形转换器",
                    "zh-hant": "一個日語變化轉換器"
                }
            },
            "https://github.com/ku-nlp/kwja": {
                "sub_category": null,
                "repository_name": "kwja",
                "user_name": "ku-nlp",
                "description": "A unified language analyzer for Japanese",
                "multilingual_descriptions": {
                    "en": "A unified language analyzer for Japanese",
                    "ja": "日本語の統一された言語解析器",
                    "zh-hans": "一个用于日语的统一语言分析器",
                    "zh-hant": "一個統一的日語語言分析器"
                }
            },
            "https://github.com/Ryutaro-A/mlm-scoring-transformers": {
                "sub_category": null,
                "repository_name": "mlm-scoring-transformers",
                "user_name": "Ryutaro-A",
                "description": "Reproduced package based on Masked Language Model Scoring (ACL2020).",
                "multilingual_descriptions": {
                    "en": "Reproduced package based on Masked Language Model Scoring (ACL2020).",
                    "ja": "マスクされた言語モデルスコアリングに基づく再現パッケージ（ACL2020）。",
                    "zh-hans": "基于掩码语言模型评分的复制包（ACL2020）。",
                    "zh-hant": "基於遮蔽語言模型評分的複製套件（ACL2020）。"
                }
            },
            "https://github.com/Japanese-Image-Captioning/ClipCap-for-Japanese": {
                "sub_category": null,
                "repository_name": "ClipCap-for-Japanese",
                "user_name": "Japanese-Image-Captioning",
                "description": "[PyTorch] ClipCap for Japanese",
                "multilingual_descriptions": {
                    "en": "[PyTorch] ClipCap for Japanese",
                    "ja": "[PyTorch] 日本語のClipCap",
                    "zh-hans": "[PyTorch] 日语ClipCap",
                    "zh-hant": "[PyTorch] 日語 ClipCap"
                }
            },
            "https://github.com/Japanese-Image-Captioning/SAT-for-Japanese": {
                "sub_category": null,
                "repository_name": "SAT-for-Japanese",
                "user_name": "Japanese-Image-Captioning",
                "description": "[PyTorch] Show, Attend and Tell for Japanese",
                "multilingual_descriptions": {
                    "en": "[PyTorch] Show, Attend and Tell for Japanese",
                    "ja": "[PyTorch] 日本語のための Show, Attend and Tell",
                    "zh-hans": "[PyTorch] 展示、关注和讲述日语",
                    "zh-hant": "[PyTorch] 展示、關注和講述日語"
                }
            },
            "https://github.com/cihai/cihai": {
                "sub_category": null,
                "repository_name": "cihai",
                "user_name": "cihai",
                "description": "Python library for CJK (Chinese, Japanese, and Korean) language dictionary",
                "multilingual_descriptions": {
                    "en": "Python library for CJK (Chinese, Japanese, and Korean) language dictionary",
                    "ja": "CJK（中国語、日本語、韓国語）言語辞書のためのPythonライブラリ",
                    "zh-hans": "Python CJK（中文、日文、韩文）语言字典库",
                    "zh-hant": "Python CJK（中文、日文、韓文）語言字典庫"
                }
            },
            "https://github.com/6gsn/marine": {
                "sub_category": null,
                "repository_name": "marine",
                "user_name": "6gsn",
                "description": "MARINE : Multi-task leaRnIng-based JapaNese accent Estimation",
                "multilingual_descriptions": {
                    "en": "MARINE : Multi-task leaRnIng-based JapaNese accent Estimation",
                    "ja": "MARINE：マルチタスク学習に基づく日本語アクセント推定",
                    "zh-hans": "MARINE：基于多任务学习的日语口音估计",
                    "zh-hant": "MARINE：基於多任務學習的日語口音估計"
                }
            },
            "https://github.com/sarulab-speech/whisper-asr-finetune": {
                "sub_category": null,
                "repository_name": "whisper-asr-finetune",
                "user_name": "sarulab-speech",
                "description": "Finetuning Whisper ASR model",
                "multilingual_descriptions": {
                    "en": "Fine-tuning the Whisper ASR model.",
                    "ja": "Whisper ASRモデルの微調整",
                    "zh-hans": "微调Whisper ASR模型",
                    "zh-hant": "微調Whisper ASR模型"
                }
            },
            "https://github.com/CjangCjengh/japanese_chatbot": {
                "sub_category": null,
                "repository_name": "japanese_chatbot",
                "user_name": "CjangCjengh",
                "description": "A PyTorch Implementation of japanese chatbot using BERT and Transformer's decoder",
                "multilingual_descriptions": {
                    "en": "A PyTorch Implementation of japanese chatbot using BERT and Transformer's decoder",
                    "ja": "BERTとTransformerのデコーダーを使用した日本語チャットボットのPyTorch実装",
                    "zh-hans": "使用BERT和Transformer解码器的日语聊天机器人的PyTorch实现",
                    "zh-hant": "使用BERT和Transformer解碼器的日語聊天機器人的PyTorch實現"
                }
            },
            "https://github.com/yamamaya/radicalchar": {
                "sub_category": null,
                "repository_name": "radicalchar",
                "user_name": "yamamaya",
                "description": "部首文字正規化ライブラリ",
                "multilingual_descriptions": {
                    "en": "Radical character normalization library",
                    "ja": "部首文字正規化ライブラリ",
                    "zh-hans": "部首文字规范化库",
                    "zh-hant": "部首文字正規化程式庫"
                }
            },
            "https://github.com/tokuhirom/akaza": {
                "sub_category": null,
                "repository_name": "akaza",
                "user_name": "tokuhirom",
                "description": "Yet another Japanese IME for IBus/Linux",
                "multilingual_descriptions": {
                    "en": "Yet another Japanese IME for IBus/Linux",
                    "ja": "IBus/Linux用のもう一つの日本語IME",
                    "zh-hans": "又一个适用于IBus/Linux的日语输入法",
                    "zh-hant": "又一個針對IBus/Linux的日文輸入法"
                }
            },
            "https://github.com/polm/posuto": {
                "sub_category": null,
                "repository_name": "posuto",
                "user_name": "polm",
                "description": "Japanese postal code data.",
                "multilingual_descriptions": {
                    "en": "日本の郵便番号データ。",
                    "ja": "日本の郵便番号データ。",
                    "zh-hans": "日本邮政编码数据。",
                    "zh-hant": "日本郵遞區號資料。"
                }
            },
            "https://github.com/CjangCjengh/tacotron2-japanese": {
                "sub_category": null,
                "repository_name": "tacotron2-japanese",
                "user_name": "CjangCjengh",
                "description": "Tacotron2 implementation of Japanese",
                "multilingual_descriptions": {
                    "en": "Tacotron2 implementation of Japanese",
                    "ja": "日本語のTacotron2の実装",
                    "zh-hans": "Tacotron2的日语实现",
                    "zh-hant": "Tacotron2 日語實現"
                }
            },
            "https://github.com/esrille/ibus-hiragana": {
                "sub_category": null,
                "repository_name": "ibus-hiragana",
                "user_name": "esrille",
                "description": "ひらがなIME for IBus",
                "multilingual_descriptions": {
                    "en": "Hiragana IME for IBus",
                    "ja": "ひらがなIME for IBus",
                    "zh-hans": "IBus平假名输入法",
                    "zh-hant": "IBus 平假名輸入法"
                }
            },
            "https://github.com/esrille/furiganapad": {
                "sub_category": null,
                "repository_name": "furiganapad",
                "user_name": "esrille",
                "description": "ふりがなパッド",
                "multilingual_descriptions": {
                    "en": "Furigana pad",
                    "ja": "ふりがなパッド",
                    "zh-hans": "假名垫",
                    "zh-hant": "注音輸入板"
                }
            },
            "https://github.com/WorksApplications/chikkarpy": {
                "sub_category": null,
                "repository_name": "chikkarpy",
                "user_name": "WorksApplications",
                "description": "Japanese synonym library",
                "multilingual_descriptions": {
                    "en": "Japanese synonym library",
                    "ja": "日本語類語辞書",
                    "zh-hans": "日语同义词库",
                    "zh-hant": "日語同義詞庫"
                }
            },
            "https://github.com/p-geon/ja-tokenizer-docker-py": {
                "sub_category": null,
                "repository_name": "ja-tokenizer-docker-py",
                "user_name": "p-geon",
                "description": "Mecab + NEologd + Docker + Python3",
                "multilingual_descriptions": {
                    "en": "Mecab + NEologd + Docker + Python3",
                    "ja": "Mecab + NEologd + Docker + Python3 の入力となります。",
                    "zh-hans": "Mecab + NEologd + Docker + Python3 的输出",
                    "zh-hant": "Mecab + NEologd + Docker + Python3\nMecab + NEologd + Docker + Python3"
                }
            },
            "https://github.com/oshizo/JapaneseEmbeddingEval": {
                "sub_category": null,
                "repository_name": "JapaneseEmbeddingEval",
                "user_name": "oshizo",
                "description": "JapaneseEmbeddingEval",
                "multilingual_descriptions": {
                    "en": "Japanese Embedding Evaluation",
                    "ja": "日本語埋め込み評価",
                    "zh-hans": "日语嵌入评估",
                    "zh-hant": "日本嵌入評估"
                }
            },
            "https://github.com/karakuri-ai/gptuber-by-langchain": {
                "sub_category": null,
                "repository_name": "gptuber-by-langchain",
                "user_name": "karakuri-ai",
                "description": "GPTがYouTuberをやります",
                "multilingual_descriptions": {
                    "en": "GPT will become a YouTuber.",
                    "ja": "GPTがYouTuberをやります",
                    "zh-hans": "GPT将成为YouTuber。",
                    "zh-hant": "GPT會當YouTuber"
                }
            },
            "https://github.com/google/shuwa": {
                "sub_category": null,
                "repository_name": "shuwa",
                "user_name": "google",
                "description": "Extend GNOME On-Screen Keyboard for Input Methods",
                "multilingual_descriptions": {
                    "en": "Extend GNOME On-Screen Keyboard for Input Methods",
                    "ja": "入力方法のためにGNOMEオンスクリーンキーボードを拡張する",
                    "zh-hans": "扩展GNOME屏幕键盘以支持输入法",
                    "zh-hant": "擴展 GNOME 螢幕鍵盤以支援輸入法"
                }
            },
            "https://github.com/CyberAgentAILab/japanese-nli-model": {
                "sub_category": null,
                "repository_name": "japanese-nli-model",
                "user_name": "CyberAgentAILab",
                "description": "This repository provides the code for Japanese NLI model, a fine-tuned masked language model.",
                "multilingual_descriptions": {
                    "en": "This repository provides the code for Japanese NLI model, a fine-tuned masked language model.",
                    "ja": "このリポジトリは、日本語NLIモデルのコードを提供しており、ファインチューニングされたマスク言語モデルです。",
                    "zh-hans": "这个代码库提供了日语NLI模型的代码，这是一个经过微调的掩码语言模型。",
                    "zh-hant": "這個存儲庫提供了日語NLI模型的代碼，一個經過微調的遮蔽語言模型。"
                }
            },
            "https://github.com/tos-kamiya/tra-fugu": {
                "sub_category": null,
                "repository_name": "tra-fugu",
                "user_name": "tos-kamiya",
                "description": "A tool for Japanese-English translation and English-Japanese translation by using FuguMT",
                "multilingual_descriptions": {
                    "en": "A tool for Japanese-English translation and English-Japanese translation by using FuguMT",
                    "ja": "FuguMTを使用した日本語-英語翻訳および英語-日本語翻訳のためのツール。",
                    "zh-hans": "使用FuguMT进行日英翻译和英日翻译的工具",
                    "zh-hant": "使用FuguMT進行日英翻譯和英日翻譯的工具"
                }
            },
            "https://github.com/s-taka/fugumt": {
                "sub_category": null,
                "repository_name": "fugumt",
                "user_name": "s-taka",
                "description": "ぷるーふおぶこんせぷと で公開した機械翻訳エンジンを利用する翻訳環境です。 フォームに入力された文字列の翻訳、PDFの翻訳が可能です。",
                "multilingual_descriptions": {
                    "en": "This is a translation environment that uses a machine translation engine released on the Blue Forest Concept website. It is capable of translating input text strings and PDF files through a form.",
                    "ja": "ぷるーふおぶこんせぷと で公開した機械翻訳エンジンを利用する翻訳環境です。 フォームに入力された文字列の翻訳、PDFの翻訳が可能です。",
                    "zh-hans": "这是一个使用在Plofile Hub Connect上公开的机器翻译引擎的翻译环境。可以翻译输入到表格中的字符串和PDF文件。",
                    "zh-hant": "這是一個使用在ぷるーふおぶこんせぷと上公開的機器翻譯引擎的翻譯環境。可以翻譯輸入在表格中的文字，以及 PDF 文件的翻譯。"
                }
            },
            "https://github.com/keio-smilab23/JaSPICE": {
                "sub_category": null,
                "repository_name": "JaSPICE",
                "user_name": "keio-smilab23",
                "description": "JaSPICE: Automatic Evaluation Metric Using Predicate-Argument Structures for Image Captioning Models",
                "multilingual_descriptions": {
                    "en": "JaSPICE: Automatic Evaluation Metric Using Predicate-Argument Structures for Image Captioning Models",
                    "ja": "JaSPICE：画像キャプショニングモデルの述語引数構造を使用した自動評価メトリック",
                    "zh-hans": "JaSPICE：使用谓词-论元结构自动评估图像字幕模型的评估指标",
                    "zh-hant": "JaSPICE：使用謂詞-參數結構自動評估圖像標題模型的評估指標"
                }
            },
            "https://github.com/yantaisa11/Retrieval-based-Voice-Conversion-WebUI-JP-localization": {
                "sub_category": null,
                "repository_name": "Retrieval-based-Voice-Conversion-WebUI-JP-localization",
                "user_name": "yantaisa11",
                "description": "jp-localization",
                "multilingual_descriptions": {
                    "en": "Japanese localization",
                    "ja": "日本語ローカライゼーション",
                    "zh-hans": "日本本地化",
                    "zh-hant": "日本本地化"
                }
            },
            "https://github.com/r9y9/pyopenjtalk": {
                "sub_category": null,
                "repository_name": "pyopenjtalk",
                "user_name": "r9y9",
                "description": "Python wrapper for OpenJTalk",
                "multilingual_descriptions": {
                    "en": "Python wrapper for OpenJTalk",
                    "ja": "OpenJTalkのPythonラッパー",
                    "zh-hans": "Python封装OpenJTalk",
                    "zh-hant": "Python 封裝 OpenJTalk"
                }
            },
            "https://github.com/rabbit19981023/yomigana-ebook": {
                "sub_category": null,
                "repository_name": "yomigana-ebook",
                "user_name": "rabbit19981023",
                "description": "Make learning Japanese easier by adding readings for every kanji in the eBook",
                "multilingual_descriptions": {
                    "en": "Make learning Japanese easier by adding readings for every kanji in the eBook",
                    "ja": "電子書籍に漢字の読み方を追加することで、日本語の学習をより簡単にすることができます。",
                    "zh-hans": "通过在电子书中为每个汉字添加读音，使学习日语更容易。",
                    "zh-hant": "在電子書中為每個漢字添加讀音，讓學習日語更容易。"
                }
            },
            "https://github.com/Ayanaminn/N46Whisper": {
                "sub_category": null,
                "repository_name": "N46Whisper",
                "user_name": "Ayanaminn",
                "description": "Whisper based Japanese subtitle generator",
                "multilingual_descriptions": {
                    "en": "Whisper based Japanese subtitle generator",
                    "ja": "ささやきベースの日本語字幕生成ツール",
                    "zh-hans": "基于耳语的日文字幕生成器",
                    "zh-hant": "基於耳語的日文字幕生成器"
                }
            },
            "https://github.com/noir55/japanese_llm_simple_webui": {
                "sub_category": null,
                "repository_name": "japanese_llm_simple_webui",
                "user_name": "noir55",
                "description": "Rinna-3.6B、OpenCALM等の日本語対応LLM(大規模言語モデル)用の簡易Webインタフェースです",
                "multilingual_descriptions": {
                    "en": "This is a simple web interface for Japanese compatible LLM (Large Language Model) such as Rinna-3.6B and OpenCALM.",
                    "ja": "Rinna-3.6B、OpenCALM等の日本語対応LLM(大規模言語モデル)用の簡易Webインタフェースです",
                    "zh-hans": "Rinna-3.6B、OpenCALM等是用于日语支持的大规模语言模型（LLM）的简易Web界面。",
                    "zh-hant": "Rinna-3.6B、OpenCALM等的日本語對應LLM(大規模言語模型)用的簡易Web介面是。"
                }
            },
            "https://github.com/discus0434/pdf-translator": {
                "sub_category": null,
                "repository_name": "pdf-translator",
                "user_name": "discus0434",
                "description": "pdf-translator translates English PDF files into Japanese, preserving the original layout.",
                "multilingual_descriptions": {
                    "en": "pdf-translator translates English PDF files into Japanese, preserving the original layout.",
                    "ja": "pdf-translatorは、英語のPDFファイルを日本語に翻訳し、元のレイアウトを保持します。",
                    "zh-hans": "pdf-translator将英文PDF文件翻译成日语，保留原始布局。",
                    "zh-hant": "pdf-translator 將英文 PDF 檔案翻譯成日文，並保留原始的版面配置。"
                }
            },
            "https://github.com/Shingo-Kamata/japanese_qa_demo_with_haystack_and_es": {
                "sub_category": null,
                "repository_name": "japanese_qa_demo_with_haystack_and_es",
                "user_name": "Shingo-Kamata",
                "description": "Haystack + Elasticsearch + wikipedia(ja) を用いた、日本語の質問応答システムのサンプル",
                "multilingual_descriptions": {
                    "en": "Haystack + Elasticsearch + wikipedia(ja) を用いた、日本語の質問応答システムのサンプル",
                    "ja": "Haystack + Elasticsearch + wikipedia(ja) を用いた、日本語の質問応答システムのサンプル\nヘイスタック + エラスティックサーチ + Wikipedia(ja) を使用した、日本語の質問応答システムのサンプル",
                    "zh-hans": "使用Haystack + Elasticsearch + wikipedia(ja)构建的日语问答系统示例",
                    "zh-hant": "使用Haystack + Elasticsearch + wikipedia(ja)構建的日語問答系統的示例"
                }
            },
            "https://github.com/google/mozc-devices": {
                "sub_category": null,
                "repository_name": "mozc-devices",
                "user_name": "google",
                "description": "Automatically exported from code.google.com/p/mozc-morse",
                "multilingual_descriptions": {
                    "en": "Automatically exported from code.google.com/p/mozc-morse",
                    "ja": "自動的にcode.google.com/p/mozc-morseからエクスポートされました。",
                    "zh-hans": "自动从code.google.com/p/mozc-morse导出",
                    "zh-hant": "自動從code.google.com/p/mozc-morse匯出"
                }
            },
            "https://github.com/faruzan0820/natsume": {
                "sub_category": null,
                "repository_name": "natsume",
                "user_name": "faruzan0820",
                "description": "A Japanese text frontend processing toolkit",
                "multilingual_descriptions": {
                    "en": "A Japanese text frontend processing toolkit",
                    "ja": "日本語テキストフロントエンド処理ツールキット",
                    "zh-hans": "一个日文文本前端处理工具包",
                    "zh-hant": "一個日文文本前端處理工具包"
                }
            },
            "https://github.com/litagin02/vits-japros-webui": {
                "sub_category": null,
                "repository_name": "vits-japros-webui",
                "user_name": "litagin02",
                "description": "日本語TTS（VITS）の学習と音声合成のGradio WebUI",
                "multilingual_descriptions": {
                    "en": "日本語TTS（VITS）の学習と音声合成のGradio WebUI",
                    "ja": "日本語TTS（VITS）の学習と音声合成のGradio WebUI",
                    "zh-hans": "日本语TTS（VITS）的学习和音频合成的Gradio WebUI",
                    "zh-hant": "日本語TTS（VITS）的學習和音訊合成的Gradio WebUI\n日本語TTS（VITS）的學習和音訊合成的Gradio WebUI"
                }
            },
            "https://github.com/takuyaa/ja-law-parser": {
                "sub_category": null,
                "repository_name": "ja-law-parser",
                "user_name": "takuyaa",
                "description": "A Japanese law parser",
                "multilingual_descriptions": {
                    "en": "A Japanese law parser",
                    "ja": "日本の法律パーサー",
                    "zh-hans": "一个日本法律解析器",
                    "zh-hant": "一個日本法律解析器"
                }
            },
            "https://github.com/julius-speech/dictation-kit": {
                "sub_category": null,
                "repository_name": "dictation-kit",
                "user_name": "julius-speech",
                "description": "Japanese dictation kit using Julius",
                "multilingual_descriptions": {
                    "en": "日本語の音声認識キットを使用しているジュリウス",
                    "ja": "Juliusを使用した日本語音声認識キット",
                    "zh-hans": "使用Julius的日语口述套件",
                    "zh-hant": "使用Julius的日語口述套件"
                }
            },
            "https://github.com/Hiroshiba/julius4seg": {
                "sub_category": null,
                "repository_name": "julius4seg",
                "user_name": "Hiroshiba",
                "description": "Juliusを使ったセグメンテーション支援ツール",
                "multilingual_descriptions": {
                    "en": "Segmentation support tool using Julius",
                    "ja": "Juliusを使ったセグメンテーション支援ツール",
                    "zh-hans": "使用Julius的分割支援工具",
                    "zh-hant": "使用Julius的分割支援工具"
                }
            },
            "https://github.com/VOICEVOX/voicevox_engine": {
                "sub_category": null,
                "repository_name": "voicevox_engine",
                "user_name": "VOICEVOX",
                "description": "無料で使える中品質なテキスト読み上げソフトウェア、VOICEVOXの音声合成エンジン",
                "multilingual_descriptions": {
                    "en": "VOICEVOX is a high-quality text-to-speech software that can be used for free.",
                    "ja": "無料で使える中品質なテキスト読み上げソフトウェア、VOICEVOXの音声合成エンジン",
                    "zh-hans": "免费使用的中等质量的文本朗读软件，VOICEVOX的语音合成引擎",
                    "zh-hant": "免費使用的中等品質文字朗讀軟體，VOICEVOX的語音合成引擎"
                }
            },
            "https://github.com/tosiyuki/LLaVA-JP": {
                "sub_category": null,
                "repository_name": "LLaVA-JP",
                "user_name": "tosiyuki",
                "description": "LLaVA-JP is a Japanese VLM trained by LLaVA method",
                "multilingual_descriptions": {
                    "en": "LLaVA-JP is a Japanese VLM trained by LLaVA method",
                    "ja": "LLaVA-JPは、LLaVAメソッドで訓練された日本のVLMです。",
                    "zh-hans": "LLaVA-JP是一种由LLaVA方法训练的日本VLM。",
                    "zh-hant": "LLaVA-JP 是一個由 LLaVA 方法訓練的日本 VLM。"
                }
            },
            "https://github.com/AkimParis/RAG-Japanese": {
                "sub_category": null,
                "repository_name": "RAG-Japanese",
                "user_name": "AkimParis",
                "description": "Open source RAG with Llama Index for Japanese LLM in low resource settting",
                "multilingual_descriptions": {
                    "en": "Open source RAG with Llama Index for Japanese LLM in low resource settting",
                    "ja": "日本の低資源設定での日本語LLM用のオープンソースRAGとLlama Index",
                    "zh-hans": "用于日本低资源环境中的开源RAG和Llama指数的LLM",
                    "zh-hant": "用於低資源環境下的日本LLM的開源RAG與Llama指數"
                }
            },
            "https://github.com/er-ri/bertjsc": {
                "sub_category": null,
                "repository_name": "bertjsc",
                "user_name": "er-ri",
                "description": "Japanese Spelling Error Corrector using BERT(Masked-Language Model). BERTに基づいて日本語校正",
                "multilingual_descriptions": {
                    "en": "Japanese Spelling Error Corrector using BERT(Masked-Language Model). BERTに基づいて日本語校正",
                    "ja": "BERTを使用した日本語スペルエラー修正ツール",
                    "zh-hans": "使用BERT（遮蔽语言模型）的日语拼写错误校正器。基于BERT的日语校正器。",
                    "zh-hant": "使用BERT（遮罩語言模型）的日語拼寫錯誤修正器。基於BERT的日語校正。"
                }
            },
            "https://github.com/wandb/llm-leaderboard": {
                "sub_category": null,
                "repository_name": "llm-leaderboard",
                "user_name": "wandb",
                "description": "Project of llm evaluation to Japanese tasks",
                "multilingual_descriptions": {
                    "en": "Project of llm evaluation to Japanese tasks",
                    "ja": "日本のタスクのLLM評価プロジェクト",
                    "zh-hans": "日本任务的llm评估项目",
                    "zh-hant": "日本任務的llm評估項目"
                }
            },
            "https://github.com/nobu-g/jglue-evaluation-scripts": {
                "sub_category": null,
                "repository_name": "jglue-evaluation-scripts",
                "user_name": "nobu-g",
                "description": "About",
                "multilingual_descriptions": {
                    "en": "About Training and evaluation scripts for JGLUE, a Japanese language understanding benchmark",
                    "ja": "JGLUEのトレーニングと評価スクリプトについて、日本語理解のベンチマークに関して\nJGLUEは、日本語理解のベンチマークのためのトレーニングと評価スクリプトについての情報です。",
                    "zh-hans": "关于JGLUE的培训和评估脚本，这是一个日语理解基准测试。",
                    "zh-hant": "關於JGLUE的培訓和評估腳本，這是一個日語理解基準的項目。"
                }
            },
            "https://github.com/ZhaoPeiduo/BLIP2-Japanese": {
                "sub_category": null,
                "repository_name": "BLIP2-Japanese",
                "user_name": "ZhaoPeiduo",
                "description": "Modifying LAVIS' BLIP2 Q-former with models pretrained on Japanese datasets.",
                "multilingual_descriptions": {
                    "en": "Modifying LAVIS' BLIP2 Q-former with models pretrained on Japanese datasets.",
                    "ja": "日本のデータセットで事前学習されたモデルを使用して、LAVISのBLIP2 Q-formerを修正します。\nLAVISのBLIP2 Q-formerを日本のデータセットで事前学習されたモデルを用いて修正します。",
                    "zh-hans": "使用在日本数据集上预训练的模型来修改LAVIS的BLIP2 Q-former。",
                    "zh-hant": "使用在日本數據集上預訓練的模型，修改LAVIS的BLIP2 Q-former。"
                }
            },
            "https://github.com/hotchpotch/wikipedia-passages-jawiki-embeddings-utils": {
                "sub_category": null,
                "repository_name": "wikipedia-passages-jawiki-embeddings-utils",
                "user_name": "hotchpotch",
                "description": "wikipedia 日本語の文を、各種日本語の embeddings や faiss index へと変換するスクリプト等。",
                "multilingual_descriptions": {
                    "en": "wikipedia 日本語の文を、各種日本語の embeddings や faiss index へと変換するスクリプト等。",
                    "ja": "wikipedia 日本語の文を、各種日本語の embeddings や faiss index へと変換するスクリプト等。",
                    "zh-hans": "wikipedia 日本语的文本转换为各种日本语嵌入和faiss索引的脚本等。",
                    "zh-hant": "將維基百科的日文句子轉換為各種日文嵌入和faiss索引的腳本等。"
                }
            },
            "https://github.com/hpprc/simple-simcse-ja": {
                "sub_category": null,
                "repository_name": "simple-simcse-ja",
                "user_name": "hpprc",
                "description": "Exploring Japanese SimCSE",
                "multilingual_descriptions": {
                    "en": "Exploring Japanese SimCSE",
                    "ja": "日本語のSimCSEを探索中",
                    "zh-hans": "探索日本SimCSE",
                    "zh-hant": "探索日本SimCSE"
                }
            },
            "https://github.com/lawofcycles/wikipedia-japanese-open-rag": {
                "sub_category": null,
                "repository_name": "wikipedia-japanese-open-rag",
                "user_name": "lawofcycles",
                "description": "Wikipediaの日本語記事を元に、ユーザの質問に回答するGradioベースのRAGのサンプル",
                "multilingual_descriptions": {
                    "en": "Sample RAG based on Gradio to answer user questions using Japanese Wikipedia articles",
                    "ja": "Wikipediaの日本語記事を元に、ユーザの質問に回答するGradioベースのRAGのサンプル",
                    "zh-hans": "基于Wikipedia日语文章的Gradio基础RAG示例，用于回答用户问题。",
                    "zh-hant": "根據Wikipedia的日文文章，回答用戶問題的Gradio基於RAG的示例。"
                }
            },
            "https://github.com/northern-system-service/gpt4-autoeval": {
                "sub_category": null,
                "repository_name": "gpt4-autoeval",
                "user_name": "northern-system-service",
                "description": "GPT-4 を用いて、言語モデルの応答を自動評価するスクリプト",
                "multilingual_descriptions": {
                    "en": "Script for automatically evaluating language model responses using GPT-4.",
                    "ja": "GPT-4 を用いて、言語モデルの応答を自動評価するスクリプト",
                    "zh-hans": "使用GPT-4来自动评估语言模型的响应的脚本",
                    "zh-hant": "使用GPT-4來自動評估語言模型的回應腳本"
                }
            },
            "https://github.com/sonoisa/t5-japanese": {
                "sub_category": null,
                "repository_name": "t5-japanese",
                "user_name": "sonoisa",
                "description": "日本語T5モデル",
                "multilingual_descriptions": {
                    "en": "Japanese T5 model",
                    "ja": "日本語T5モデル",
                    "zh-hans": "日语T5模型",
                    "zh-hant": "日語T5模型"
                }
            },
            "https://github.com/lightblue-tech/japanese_llm_eval": {
                "sub_category": null,
                "repository_name": "japanese_llm_eval",
                "user_name": "lightblue-tech",
                "description": "A repo for evaluating Japanese LLMs　・　日本語LLMを評価するレポ",
                "multilingual_descriptions": {
                    "en": "A repo for evaluating Japanese LLMs　・　日本語LLMを評価するレポ",
                    "ja": "日本語LLMを評価するためのリポジトリ",
                    "zh-hans": "用于评估日本语LLM的存储库",
                    "zh-hant": "用於評估日本語LLM的存儲庫 ・ 評估日本語LLM的存儲庫"
                }
            },
            "https://github.com/sbintuitions/jmteb": {
                "sub_category": null,
                "repository_name": "jmteb",
                "user_name": "sbintuitions",
                "description": "The evaluation scripts of JMTEB (Japanese Massive Text Embedding Benchmark)",
                "multilingual_descriptions": {
                    "en": "The evaluation scripts of JMTEB (Japanese Massive Text Embedding Benchmark)",
                    "ja": "JMTEB（日本語大規模テキスト埋め込みベンチマーク）の評価スクリプト",
                    "zh-hans": "JMTEB（日本大规模文本嵌入基准测试）的评估脚本",
                    "zh-hant": "JMTEB（日本大规模文本嵌入基准测试）的评估脚本"
                }
            },
            "https://github.com/dwangomediavillage/pydomino": {
                "sub_category": null,
                "repository_name": "pydomino",
                "user_name": "dwangomediavillage",
                "description": "日本語音声に対して音素ラベルをアラインメントするためのツールです",
                "multilingual_descriptions": {
                    "en": "This is a tool for aligning phoneme labels with Japanese language audio.",
                    "ja": "日本語音声に対して音素ラベルをアラインメントするためのツールです",
                    "zh-hans": "这是一个用于对日语语音进行音素标签对齐的工具。",
                    "zh-hant": "這是一個用於對日語語音進行音素標籤對齊的工具。"
                }
            },
            "https://github.com/zuntan03/easynovelassistant": {
                "sub_category": null,
                "repository_name": "easynovelassistant",
                "user_name": "zuntan03",
                "description": "軽量で規制も検閲もない日本語ローカル LLM『LightChatAssistant-TypeB』による、簡単なノベル生成アシスタントです。ローカル特権の永続生成 Generate forever で、当たりガチャを積み上げます。読み上げにも対応。",
                "multilingual_descriptions": {
                    "en": "This is a simple novel generation assistant using the lightweight and unregulated Japanese local LLM \"LightChatAssistant-TypeB\". It generates forever with local privileges, stacking up hit gachas. It also supports reading aloud.",
                    "ja": "軽量で規制も検閲もない日本語ローカル LLM『LightChatAssistant-TypeB』による、簡単なノベル生成アシスタントです。ローカル特権の永続生成 Generate forever で、当たりガチャを積み上げます。読み上げにも対応。",
                    "zh-hans": "轻量且无限制和审查的日语本地LLM“LightChatAssistant-TypeB”提供简易小说生成助手。通过本地特权的永久生成功能，堆积中奖抽奖。支持朗读功能。",
                    "zh-hant": "輕量且無規制和審查的日語本地 LLM『LightChatAssistant-TypeB』所提供的簡單小說生成助手。利用本地特權永久生成，堆積中獎的 Gacha。支援朗讀功能。"
                }
            },
            "https://github.com/sonoisa/clip-japanese": {
                "sub_category": null,
                "repository_name": "clip-japanese",
                "user_name": "sonoisa",
                "description": "日本語データセットでのqlora instruction tuning学習サンプルコード",
                "multilingual_descriptions": {
                    "en": "Japanese CLIP model",
                    "ja": "日本語CLIPモデル",
                    "zh-hans": "日语CLIP模型",
                    "zh-hant": "日語CLIP模型"
                }
            },
            "https://github.com/lazyfoxchan/rime-jaroomaji": {
                "sub_category": null,
                "repository_name": "rime-jaroomaji",
                "user_name": "lazyfoxchan",
                "description": "Japanese rōmaji input schema for Rime IME",
                "multilingual_descriptions": {
                    "en": "Japanese rōmaji input schema for Rime IME",
                    "ja": "Rime IMEのための日本語ローマ字入力スキーマ",
                    "zh-hans": "Rime输入法的日语罗马字输入方案",
                    "zh-hant": "Rime IME 的日文羅馬拼音輸入方案"
                }
            },
            "https://github.com/sonoisa/deep-question-generation": {
                "sub_category": null,
                "repository_name": "deep-question-generation",
                "user_name": "sonoisa",
                "description": "深層学習を用いたクイズ自動生成（日本語T5モデル）",
                "multilingual_descriptions": {
                    "en": "Quiz automatic generation using deep learning (Japanese T5 model)",
                    "ja": "深層学習を用いたクイズ自動生成（日本語T5モデル）",
                    "zh-hans": "使用深度学习生成的自动化测验（日语T5模型）",
                    "zh-hant": "使用深度學習生成的測驗（日語T5模型）"
                }
            },
            "https://github.com/aratako/magpie-nemotron": {
                "sub_category": null,
                "repository_name": "magpie-nemotron",
                "user_name": "aratako",
                "description": "Magpieという手法とNemotron-4-340B-Instructを用いて合成対話データセットを作るコード",
                "multilingual_descriptions": {
                    "en": "Code to create a synthetic dialogue dataset using the technique called Magpie and Nemotron-4-340B-Instruct.",
                    "ja": "Magpieという手法とNemotron-4-340B-Instructを用いて合成対話データセットを作るコード",
                    "zh-hans": "使用Magpie技术和Nemotron-4-340B-Instruct创建合成对话数据集的代码",
                    "zh-hant": "使用Magpie技術和Nemotron-4-340B-Instruct來創建合成對話數據集的代碼"
                }
            },
            "https://github.com/sosuke115/qlora_ja": {
                "sub_category": null,
                "repository_name": "qlora_ja",
                "user_name": "sosuke115",
                "description": "日本語データセットでのqlora instruction tuning学習サンプルコード",
                "multilingual_descriptions": {
                    "en": "Sample code for qlora instruction tuning learning in a Japanese dataset.",
                    "ja": "日本語データセットでのqlora instruction tuning学習サンプルコード",
                    "zh-hans": "在日语数据集上进行qlora指令调整的学习示例代码",
                    "zh-hant": "在日本語數據集中進行qlora指令調整學習的示例代碼"
                }
            },
            "https://github.com/utuhiro78/mozcdic-ut-jawiki": {
                "sub_category": null,
                "repository_name": "mozcdic-ut-jawiki",
                "user_name": "utuhiro78",
                "description": "Mozc UT Jawiki Dictionary is a dictionary generated from the Japanese Wikipedia for Mozc.",
                "multilingual_descriptions": {
                    "en": "Mozc UT Jawiki Dictionary is a dictionary generated from the Japanese Wikipedia for Mozc.",
                    "ja": "Mozc UT Jawiki辞書は、Mozc用に日本語のWikipediaから生成された辞書です。",
                    "zh-hans": "Mozc UT Jawiki词典是从日文维基百科为Mozc生成的词典。",
                    "zh-hant": "Mozc UT Jawiki 字典是從日文維基百科生成的字典，用於 Mozc。"
                }
            },
            "https://github.com/shisa-ai/shisa-v2": {
                "sub_category": null,
                "repository_name": "shisa-v2",
                "user_name": "shisa-ai",
                "description": "Japanese / English Bilingual LLM",
                "multilingual_descriptions": {
                    "en": "Japanese / English Bilingual LLM",
                    "ja": "日本語/英語バイリンガルLLM",
                    "zh-hans": "日英双语法学硕士",
                    "zh-hant": "日英雙語法學碩士"
                }
            },
            "https://github.com/hpprc/llm-translator": {
                "sub_category": null,
                "repository_name": "llm-translator",
                "user_name": "hpprc",
                "description": "Mixtral-based Ja-En (En-Ja) Translation model",
                "multilingual_descriptions": {
                    "en": "Mixtral-based Ja-En (En-Ja) Translation model",
                    "ja": "ミクストラルベースの日英（英日）翻訳モデル",
                    "zh-hans": "基于Mixtral的Ja-En（En-Ja）翻译模型",
                    "zh-hant": "基於Mixtral的Ja-En（En-Ja）翻譯模型"
                }
            },
            "https://github.com/tosiyuki/llm-jp-asr": {
                "sub_category": null,
                "repository_name": "llm-jp-asr",
                "user_name": "tosiyuki",
                "description": "Whisperのデコーダをllm-jp-1.3b-v1.0に置き換えた音声認識モデルを学習させるためのコード",
                "multilingual_descriptions": {
                    "en": "Code for training a speech recognition model using a Whisper decoder replaced with llm-jp-1.3b-v1.0.",
                    "ja": "Whisperのデコーダをllm-jp-1.3b-v1.0に置き換えた音声認識モデルを学習させるためのコード",
                    "zh-hans": "将Whisper的解码器替换为llm-jp-1.3b-v1.0版本的语音识别模型的学习代码",
                    "zh-hant": "將Whisper的解碼器替換為llm-jp-1.3b-v1.0版本的語音識別模型的學習代碼。"
                }
            },
            "https://github.com/akimfromparis/rag-japanese": {
                "sub_category": null,
                "repository_name": "rag-japanese",
                "user_name": "akimfromparis",
                "description": "Open source RAG with Llama Index for Japanese LLM in low resource settting",
                "multilingual_descriptions": {
                    "en": "Open source RAG with Llama Index for Japanese LLM in low resource settting",
                    "ja": "日本の低リソース環境でのLLM向けのラマ指数付きのオープンソースRAG",
                    "zh-hans": "在资源匮乏的环境中，使用Llama指数为日本LLM开源的RAG",
                    "zh-hant": "在資源有限的環境中，使用羊駝指數為日本LLM開源的RAG"
                }
            },
            "https://github.com/komiya-lab/monaka": {
                "sub_category": null,
                "repository_name": "monaka",
                "user_name": "komiya-lab",
                "description": "A Japanese Parser (including historical Japanese)",
                "multilingual_descriptions": {
                    "en": "A Japanese Parser (including historical Japanese)",
                    "ja": "日本語パーサー（歴史的な日本語を含む）",
                    "zh-hans": "一个日语解析器（包括历史日语）",
                    "zh-hant": "一個日本語解析器（包括歷史日本語）"
                }
            },
            "https://github.com/matthewbieda/jp-translate.cloud": {
                "sub_category": null,
                "repository_name": "jp-translate.cloud",
                "user_name": "matthewbieda",
                "description": "A state-of-the-art open-source Japanese <--> English machine translation system based on the latest NMT research.",
                "multilingual_descriptions": {
                    "en": "A state-of-the-art open-source Japanese <--> English machine translation system based on the latest NMT research.",
                    "ja": "最新のNMT研究に基づいた最先端のオープンソース日本語<-->英語機械翻訳システム。",
                    "zh-hans": "基于最新的NMT研究，采用最先进的开源日语<-->英语机器翻译系统。",
                    "zh-hant": "一個基於最新的NMT研究的最先進的開源日語<-->英語機器翻譯系統。"
                }
            },
            "https://github.com/toufu-24/substring-word-finder": {
                "sub_category": null,
                "repository_name": "substring-word-finder",
                "user_name": "toufu-24",
                "description": "連続部分文字列の単語判定を行います",
                "multilingual_descriptions": {
                    "en": "Perform word judgment on consecutive substring.",
                    "ja": "連続部分文字列の単語判定を行います",
                    "zh-hans": "进行连续子字符串的单词判断",
                    "zh-hant": "連續部分字串的單詞判定。"
                }
            },
            "https://github.com/wandb/heron-vlm-leaderboard": {
                "sub_category": null,
                "repository_name": "heron-vlm-leaderboard",
                "user_name": "wandb",
                "description": "This project is a benchmarking tool for evaluating and comparing the performance of various Vision Language Models (VLMs). It uses two datasets: LLaVA-Bench-In-the-Wild and Japanese HERON Bench to measure model performance.",
                "multilingual_descriptions": {
                    "en": "This project is a benchmarking tool for evaluating and comparing the performance of various Vision Language Models (VLMs). It uses two datasets: LLaVA-Bench-In-the-Wild and Japanese HERON Bench to measure model performance.",
                    "ja": "このプロジェクトは、さまざまなビジョン言語モデル（VLMs）のパフォーマンスを評価および比較するためのベンチマークツールです。モデルのパフォーマンスを測定するために、LLaVA-Bench-In-the-WildとJapanese HERON Benchの2つのデータセットを使用しています。",
                    "zh-hans": "这个项目是一个基准工具，用于评估和比较各种视觉语言模型（VLMs）的性能。它使用两个数据集：LLaVA-Bench-In-the-Wild和日本HERON Bench来衡量模型的性能。",
                    "zh-hant": "這個項目是一個基準工具，用於評估和比較各種視覺語言模型（VLMs）的性能。它使用兩個數據集：LLaVA-Bench-In-the-Wild 和日本 HERON Bench 來衡量模型的性能。"
                }
            },
            "https://github.com/llm-jp/text2dataset": {
                "sub_category": null,
                "repository_name": "text2dataset",
                "user_name": "llm-jp",
                "description": "Easily turn large English text datasets into Japanese text datasets using open LLMs.",
                "multilingual_descriptions": {
                    "en": "Easily turn large English text datasets into Japanese text datasets using open LLMs.",
                    "ja": "簡単に大きな英語テキストデータセットを日本語テキストデータセットに変換できます。オープンLLMsを使用してください。",
                    "zh-hans": "使用开放的LLMs轻松将大型英文文本数据集转换为日文文本数据集。",
                    "zh-hant": "使用開放式LLM輕鬆將大型英文文本數據集轉換為日文文本數據集。"
                }
            },
            "https://github.com/bungoume/mecab-web-api": {
                "sub_category": null,
                "repository_name": "mecab-web-api",
                "user_name": "bungoume",
                "description": "MeCabを利用した日本語形態素解析WebAPI",
                "multilingual_descriptions": {
                    "en": "Japanese Morphological Analysis Web API using MeCab",
                    "ja": "MeCabを利用した日本語形態素解析WebAPI",
                    "zh-hans": "使用MeCab的日语形态素解析WebAPI",
                    "zh-hant": "使用MeCab的日語形態素解析WebAPI"
                }
            },
            "https://github.com/ajatt-tools/mecab_controller": {
                "sub_category": null,
                "repository_name": "mecab_controller",
                "user_name": "ajatt-tools",
                "description": "Mecab wrapper to generate furigana readings.",
                "multilingual_descriptions": {
                    "en": "Mecab wrapper to generate furigana readings.",
                    "ja": "ふりがな読みを生成するためのMecabラッパー",
                    "zh-hans": "用于生成振り仮名读音的Mecab包装器。",
                    "zh-hant": "Mecab包裝器生成振り仮名讀音。"
                }
            },
            "https://github.com/zassou65535/vits": {
                "sub_category": null,
                "repository_name": "vits",
                "user_name": "zassou65535",
                "description": "VITSによるテキスト読み上げ器&ボイスチェンジャー",
                "multilingual_descriptions": {
                    "en": "Text-to-speech engine and voice changer by VITS",
                    "ja": "VITSによるテキスト読み上げ器&ボイスチェンジャー",
                    "zh-hans": "VITS文本朗读器和声音变换器",
                    "zh-hant": "VITS提供的文字朗讀器和聲音變換器"
                }
            },
            "https://github.com/akarigroup/akari_chatgpt_bot": {
                "sub_category": null,
                "repository_name": "akari_chatgpt_bot",
                "user_name": "akarigroup",
                "description": "音声認識、文章生成、音声合成を使って対話するチャットボットアプリ",
                "multilingual_descriptions": {
                    "en": "Chatbot application that uses speech recognition, text generation, and speech synthesis for dialogue.",
                    "ja": "音声認識、文章生成、音声合成を使って対話するチャットボットアプリ",
                    "zh-hans": "使用语音识别、文章生成和语音合成进行对话的聊天机器人应用程序",
                    "zh-hant": "使用語音識別、文章生成和語音合成進行對話的聊天機器人應用程式"
                }
            },
            "https://github.com/bikatr7/kudasai": {
                "sub_category": null,
                "repository_name": "kudasai",
                "user_name": "bikatr7",
                "description": "Streamlining Japanese-English Translation with Advanced Preprocessing and Integrated Translation Technologies",
                "multilingual_descriptions": {
                    "en": "Streamlining Japanese-English Translation with Advanced Preprocessing and Integrated Translation Technologies",
                    "ja": "高度な前処理と統合された翻訳技術を活用して、日本語-英語翻訳を効率化する",
                    "zh-hans": "利用先进的预处理和集成翻译技术简化日英翻译",
                    "zh-hant": "利用先進的預處理和集成翻譯技術來優化日英翻譯流程"
                }
            },
            "https://github.com/sophiefy/mecab-visualizer": {
                "sub_category": null,
                "repository_name": "mecab-visualizer",
                "user_name": "sophiefy",
                "description": "MeCabの形態素解析結果を可視化するツール",
                "multilingual_descriptions": {
                    "en": "Tool to visualize the morphological analysis results of MeCab",
                    "ja": "MeCabの形態素解析結果を可視化するツール",
                    "zh-hans": "使用MeCab进行词素分析结果可视化的工具",
                    "zh-hant": "使用MeCab進行詞彙分析結果的可視化工具"
                }
            },
            "https://github.com/massao000/add-dictionary": {
                "sub_category": null,
                "repository_name": "add-dictionary",
                "user_name": "massao000",
                "description": "OpenJTalkのユーザ辞書をGUIで追加するアプリ",
                "multilingual_descriptions": {
                    "en": "An app to add user dictionaries for OpenJTalk using a GUI.",
                    "ja": "OpenJTalkのユーザ辞書をGUIで追加するアプリ",
                    "zh-hans": "使用GUI添加OpenJTalk用户词典的应用程序",
                    "zh-hant": "使用GUI添加OpenJTalk用户词典的应用程序"
                }
            },
            "https://github.com/nu-dialogue/j-moshi": {
                "sub_category": null,
                "repository_name": "j-moshi",
                "user_name": "nu-dialogue",
                "description": "J-Moshi: A Japanese Full-duplex Spoken Dialogue System",
                "multilingual_descriptions": {
                    "en": "J-Moshi: A Japanese Full-duplex Spoken Dialogue System",
                    "ja": "J-Moshi: 日本語のフルデュプレックス音声対話システム",
                    "zh-hans": "J-Moshi：一个日本全双工口语对话系统",
                    "zh-hant": "J-Moshi：一個日本全雙工口語對話系統"
                }
            },
            "https://github.com/unilight/jatts": {
                "sub_category": null,
                "repository_name": "jatts",
                "user_name": "unilight",
                "description": "JATTS: Japanese TTS (for research)",
                "multilingual_descriptions": {
                    "en": "JATTS: Japanese TTS (for research)",
                    "ja": "JATTS: 日本語TTS（研究用）",
                    "zh-hans": "JATTS: 日语TTS（用于研究）",
                    "zh-hant": "JATTS: 日文TTS（用於研究）"
                }
            }
        },
        "C++": {
            "https://github.com/taku910/mecab": {
                "sub_category": "Morphology analysis",
                "repository_name": "mecab",
                "user_name": "taku910",
                "description": "Yet another Japanese morphological analyzer",
                "multilingual_descriptions": {
                    "en": "Yet another Japanese morphological analyzer",
                    "ja": "もう一つの日本語形態素解析器",
                    "zh-hans": "又一个日语形态分析器",
                    "zh-hant": "又一個日本語形態分析器"
                }
            },
            "https://github.com/ku-nlp/jumanpp": {
                "sub_category": "Morphology analysis",
                "repository_name": "jumanpp",
                "user_name": "ku-nlp",
                "description": "Juman++ (a Morphological Analyzer Toolkit)",
                "multilingual_descriptions": {
                    "en": "Juman++ (a Morphological Analyzer Toolkit)",
                    "ja": "Juman++（形態素解析ツールキット）",
                    "zh-hans": "Juman++（一个形态分析工具包）",
                    "zh-hant": "Juman++（一個形態學分析工具包）"
                }
            },
            "https://github.com/neubig/kytea": {
                "sub_category": "Morphology analysis",
                "repository_name": "kytea",
                "user_name": "neubig",
                "description": "The Kyoto Text Analysis Toolkit for word segmentation and pronunciation estimation, etc.",
                "multilingual_descriptions": {
                    "en": "The Kyoto Text Analysis Toolkit for word segmentation and pronunciation estimation, etc.",
                    "ja": "京都テキスト分析ツールキット：単語分割や発音推定などに使用されます。",
                    "zh-hans": "京都文本分析工具包，用于词语分割和发音估计等。",
                    "zh-hant": "京都文本分析工具箱，可用於詞語分割和發音估計等。"
                }
            },
            "https://github.com/taku910/cabocha": {
                "sub_category": "Parsing",
                "repository_name": "cabocha",
                "user_name": "taku910",
                "description": "Yet Another Japanese Dependency Structure Analyzer",
                "multilingual_descriptions": {
                    "en": "Yet Another Japanese Dependency Structure Analyzer",
                    "ja": "もう一つの日本語依存構造解析ツール",
                    "zh-hans": "另一个日语依存结构分析器",
                    "zh-hant": "另一個日本依存結構分析器"
                }
            },
            "https://github.com/ku-nlp/knp": {
                "sub_category": "Parsing",
                "repository_name": "knp",
                "user_name": "ku-nlp",
                "description": "A Japanese Parser",
                "multilingual_descriptions": {
                    "en": "A Japanese Parser",
                    "ja": "日本語パーサー",
                    "zh-hans": "一个日语解析器",
                    "zh-hant": "一個日語解析器"
                }
            },
            "https://github.com/yohokuno/jsc": {
                "sub_category": null,
                "repository_name": "jsc",
                "user_name": "yohokuno",
                "description": "Joint source channel model for Japanese Kana Kanji conversion, Chinese pinyin input and CJE mixed input.",
                "multilingual_descriptions": {
                    "en": "Joint source channel model for Japanese Kana Kanji conversion, Chinese pinyin input and CJE mixed input.",
                    "ja": "日本語の仮名漢字変換、中国語のピンイン入力、CJE混合入力のための共通ソースチャネルモデル。",
                    "zh-hans": "联合源通道模型用于日语假名汉字转换、汉语拼音输入和CJE混合输入。",
                    "zh-hant": "日文假名漢字轉換、中文拼音輸入和CJE混合輸入的聯合源通道模型。"
                }
            },
            "https://github.com/codefirst/aquaskk": {
                "sub_category": null,
                "repository_name": "aquaskk",
                "user_name": "codefirst",
                "description": "An input method without morphological analysis.",
                "multilingual_descriptions": {
                    "en": "An input method without morphological analysis.",
                    "ja": "形態素解析を行わない入力方法。",
                    "zh-hans": "没有形态分析的输入法。",
                    "zh-hant": "沒有形態學分析的輸入法。"
                }
            },
            "https://github.com/google/mozc": {
                "sub_category": null,
                "repository_name": "mozc",
                "user_name": "google",
                "description": "a Japanese Input Method Editor designed for multi-platform",
                "multilingual_descriptions": {
                    "en": "Mozc - a Japanese Input Method Editor designed for multi-platform",
                    "ja": "Mozc - マルチプラットフォームに対応した日本語入力システムエディター",
                    "zh-hans": "Mozc - 一款为多平台设计的日语输入法编辑器",
                    "zh-hant": "Mozc - 一款為多平台設計的日本輸入法編輯器"
                }
            },
            "https://github.com/tuem/trimatch": {
                "sub_category": null,
                "repository_name": "trimatch",
                "user_name": "tuem",
                "description": "Trimatch: An (Exact|Prefix|Approximate) String Matching Library",
                "multilingual_descriptions": {
                    "en": "Trimatch: An (Exact|Prefix|Approximate) String Matching Library",
                    "ja": "Trimatch：（完全|接頭辞|近似）文字列マッチングライブラリ",
                    "zh-hans": "Trimatch：一个（精确|前缀|近似）字符串匹配库",
                    "zh-hant": "Trimatch：一個（精確|前綴|近似）字串匹配庫"
                }
            },
            "https://github.com/tuem/resembla": {
                "sub_category": null,
                "repository_name": "resembla",
                "user_name": "tuem",
                "description": "Resembla: Word-based Japanese similar sentence search library",
                "multilingual_descriptions": {
                    "en": "Resembla: Word-based Japanese similar sentence search library",
                    "ja": "Resembla：単語ベースの日本語類似文検索ライブラリ",
                    "zh-hans": "Resembla：基于单词的日语相似句子搜索库",
                    "zh-hant": "Resembla：基於單詞的日語相似句子搜索庫"
                }
            },
            "https://github.com/nathancorvussolis/corvusskk": {
                "sub_category": null,
                "repository_name": "corvusskk",
                "user_name": "nathancorvussolis",
                "description": "▽▼ SKK-like Japanese Input Method Editor for Windows",
                "multilingual_descriptions": {
                    "en": "▽▼ SKK-like Japanese Input Method Editor for Windows",
                    "ja": "▽▼ Windows用のSKK風日本語入力エディタ",
                    "zh-hans": "▽▼ 适用于Windows的类似SKK的日语输入法编辑器",
                    "zh-hant": "▽▼ Windows 的 SKK-like 日文輸入法編輯器"
                }
            }
        },
        "Rust crate": {
            "https://github.com/lindera-morphology/lindera": {
                "sub_category": "Morphology analysis",
                "repository_name": "lindera",
                "user_name": "lindera-morphology",
                "description": "A morphological analysis library.",
                "multilingual_descriptions": {
                    "en": "A morphological analysis library.",
                    "ja": "形態素解析ライブラリ。",
                    "zh-hans": "一个形态分析库。",
                    "zh-hant": "一個形態學分析庫。"
                }
            },
            "https://github.com/daac-tools/vaporetto": {
                "sub_category": "Morphology analysis",
                "repository_name": "vaporetto",
                "user_name": "daac-tools",
                "description": "Vaporetto: Very Accelerated POintwise pREdicTion based TOkenizer",
                "multilingual_descriptions": {
                    "en": "Vaporetto: Very Accelerated POintwise pREdicTion based TOkenizer",
                    "ja": "Vaporetto：非常に加速されたポイントワイズ予測に基づくトークナイザー",
                    "zh-hans": "Vaporetto：基于点预测的加速分词器",
                    "zh-hant": "Vaporetto：基於點預測的高速分詞器"
                }
            },
            "https://github.com/Leko/goya": {
                "sub_category": "Morphology analysis",
                "repository_name": "goya",
                "user_name": "Leko",
                "description": "Japanese Morphological Analysis written in Rust",
                "multilingual_descriptions": {
                    "en": "Japanese Morphological Analysis written in Rust",
                    "ja": "Rustで書かれた日本語形態素解析",
                    "zh-hans": "用Rust编写的日语形态分析",
                    "zh-hant": "用 Rust 寫的日語形態分析"
                }
            },
            "https://github.com/daac-tools/vibrato": {
                "sub_category": "Morphology analysis",
                "repository_name": "vibrato",
                "user_name": "daac-tools",
                "description": "vibrato: Viterbi-based accelerated tokenizer",
                "multilingual_descriptions": {
                    "en": "vibrato: Viterbi-based accelerated tokenizer",
                    "ja": "バイブラート：Viterbiベースの高速トークナイザー",
                    "zh-hans": "颤音：基于维特比加速的分词器",
                    "zh-hant": "顫音：基於維特比加速的分詞器"
                }
            },
            "https://github.com/agatan/yoin": {
                "sub_category": "Morphology analysis",
                "repository_name": "yoin",
                "user_name": "agatan",
                "description": "A Japanese Morphological Analyzer written in pure Rust",
                "multilingual_descriptions": {
                    "en": "A Japanese Morphological Analyzer written in pure Rust",
                    "ja": "純粋なRustで書かれた日本語形態素解析器",
                    "zh-hans": "一个用纯Rust编写的日语形态分析器",
                    "zh-hant": "一個用純 Rust 編寫的日語形態分析器"
                }
            },
            "https://github.com/tsurai/mecab-rs": {
                "sub_category": "Morphology analysis",
                "repository_name": "mecab-rs",
                "user_name": "tsurai",
                "description": "Safe Rust bindings for mecab a part-of-speech and morphological analyzer library",
                "multilingual_descriptions": {
                    "en": "Safe Rust bindings for mecab a part-of-speech and morphological analyzer library",
                    "ja": "「mecab」の安全なRustバインディング。品詞と形態素解析ライブラリ。",
                    "zh-hans": "安全的Rust绑定，用于mecab词性和形态分析库。",
                    "zh-hant": "安全的 Rust 綁定，用於 mecab 詞性和形態分析庫。"
                }
            },
            "https://github.com/nakagami/awabi": {
                "sub_category": "Morphology analysis",
                "repository_name": "awabi",
                "user_name": "nakagami",
                "description": "A morphological analyzer using mecab dictionary",
                "multilingual_descriptions": {
                    "en": "A morphological analyzer using mecab dictionary",
                    "ja": "MeCab辞書を使用する形態素解析器",
                    "zh-hans": "一个使用mecab字典的形态分析器",
                    "zh-hant": "一個使用mecab字典的形態分析器"
                }
            },
            "https://github.com/togatoga/kanpyo": {
                "sub_category": "Morphology analysis",
                "repository_name": "kanpyo",
                "user_name": "togatoga",
                "description": "Japanese Morphological Analyzer written in Rust",
                "multilingual_descriptions": {
                    "en": "Japanese Morphological Analyzer written in Rust",
                    "ja": "Rustで書かれた日本語形態素解析器",
                    "zh-hans": "用Rust编写的日语形态分析器",
                    "zh-hant": "用Rust编写的日语形态分析器"
                }
            },
            "https://github.com/PSeitz/wana_kana_rust": {
                "sub_category": "Converter",
                "repository_name": "wana_kana_rust",
                "user_name": "PSeitz",
                "description": "and Romaji",
                "multilingual_descriptions": {
                    "en": "Utility library for checking and converting between Japanese characters - Hiragana, Katakana - and Romaji",
                    "ja": "日本語の文字（ひらがな、カタカナ）とローマ字の間の変換とチェックを行うためのユーティリティライブラリ。",
                    "zh-hans": "用于检查和转换日语字符（平假名、片假名和罗马字）的实用程序库。",
                    "zh-hant": "檢查和轉換日文字符（平假名、片假名）和羅馬字的實用程式庫"
                }
            },
            "https://github.com/gemmarx/unicode-jp-rs": {
                "sub_category": "Converter",
                "repository_name": "unicode-jp-rs",
                "user_name": "gemmarx",
                "description": "A Rust library to convert Japanese Half-width-kana[半角ｶﾅ] and Wide-alphanumeric[全角英数] into normal ones",
                "multilingual_descriptions": {
                    "en": "A Rust library to convert Japanese Half-width-kana[半角ｶﾅ] and Wide-alphanumeric[全角英数] into normal ones",
                    "ja": "日本語の半角カナと全角英数字を通常の文字に変換するためのRustライブラリ",
                    "zh-hans": "一个 Rust 库，用于将日语半角假名和全角英数字转换为普通字符。",
                    "zh-hant": "一個 Rust 函式庫，可將日文半角ｶﾅ和全角英數轉換為正常字符。"
                }
            },
            "https://github.com/gbrlsnchs/kana": {
                "sub_category": "Converter",
                "repository_name": "kana",
                "user_name": "gbrlsnchs",
                "description": "[Mirror] CLI program for transliterating romaji text to either hiragana or katakana",
                "multilingual_descriptions": {
                    "en": "[Mirror] CLI program for transliterating romaji text to either hiragana or katakana",
                    "ja": "[ミラー] ローマ字テキストをひらがなまたはカタカナに変換するためのCLIプログラム",
                    "zh-hans": "【镜像】用于将罗马字文本转换为平假名或片假名的CLI程序。",
                    "zh-hant": "[鏡像] CLI 程序，可將羅馬字文本轉寫為平假名或片假名。"
                }
            },
            "https://github.com/samunohito/kanaria": {
                "sub_category": "Converter",
                "repository_name": "kanaria",
                "user_name": "samunohito",
                "description": "このライブラリは、ひらがな・カタカナ、半角・全角の相互変換や判別を始めとした機能を提供します。",
                "multilingual_descriptions": {
                    "en": "This library provides functions such as mutual conversion and discrimination of hiragana, katakana, half-width, and full-width characters.",
                    "ja": "このライブラリは、ひらがな・カタカナ、半角・全角の相互変換や判別を始めとした機能を提供します。",
                    "zh-hans": "这个库提供了平假名、片假名、半角和全角之间的相互转换和识别功能。",
                    "zh-hant": "這個程式庫提供了平假名、片假名、半形和全形之間的互相轉換和識別功能。"
                }
            },
            "https://github.com/yuukitoriyama/japanese-address-parser": {
                "sub_category": "Converter",
                "repository_name": "japanese-address-parser",
                "user_name": "yuukitoriyama",
                "description": "日本の住所を都道府県/市区町村/町名/その他に分割するライブラリです",
                "multilingual_descriptions": {
                    "en": "This is a library that splits Japanese addresses into prefecture/city or town/village/neighborhood/other.",
                    "ja": "日本の住所を都道府県/市区町村/町名/その他に分割するライブラリです",
                    "zh-hans": "这是一个将日本地址分割为都道府县/市区町村/町名/其他部分的库。",
                    "zh-hant": "日本的地址分割成都道府県/市區町村/町名/其他的程式庫"
                }
            },
            "https://github.com/lindera-morphology/lindera-tantivy": {
                "sub_category": "Search engine library",
                "repository_name": "lindera-tantivy",
                "user_name": "lindera-morphology",
                "description": "Lindera tokenizer for Tantivy.",
                "multilingual_descriptions": {
                    "en": "Lindera tokenizer for Tantivy.",
                    "ja": "Tantivy用のLinderaトークナイザー。",
                    "zh-hans": "Tantivy 的 Lindera 分词器。",
                    "zh-hant": "Lindera tokenizer for Tantivy. \n\n林德拉分詞器用於Tantivy。"
                }
            },
            "https://github.com/akr4/tantivy-vibrato": {
                "sub_category": "Search engine library",
                "repository_name": "tantivy-vibrato",
                "user_name": "akr4",
                "description": "A Tantivy tokenizer using Vibrato.",
                "multilingual_descriptions": {
                    "en": "A Tantivy tokenizer using Vibrato.",
                    "ja": "Vibratoを使用したTantivyトークナイザー。",
                    "zh-hans": "使用Vibrato的Tantivy分词器。",
                    "zh-hant": "使用 Vibrato 的 Tantivy 分詞器。"
                }
            },
            "https://github.com/daac-tools/daachorse": {
                "sub_category": null,
                "repository_name": "daachorse",
                "user_name": "daac-tools",
                "description": "A fast implementation of the Aho-Corasick algorithm using the compact double-array data structure in Rust.",
                "multilingual_descriptions": {
                    "en": "A fast implementation of the Aho-Corasick algorithm using the compact double-array data structure in Rust.",
                    "ja": "Rustでコンパクトなダブル配列データ構造を使用したAho-Corasickアルゴリズムの高速実装。",
                    "zh-hans": "使用Rust中的紧凑双数组数据结构快速实现Aho-Corasick算法。",
                    "zh-hant": "一個在 Rust 中使用緊湊的雙陣列資料結構實現 Aho-Corasick 算法的快速實現。"
                }
            },
            "https://github.com/legalforce-research/find-simdoc": {
                "sub_category": null,
                "repository_name": "find-simdoc",
                "user_name": "legalforce-research",
                "description": "Finding all pairs of similar documents time- and memory-efficiently",
                "multilingual_descriptions": {
                    "en": "Finding all pairs of similar documents time- and memory-efficiently",
                    "ja": "効率的な時間とメモリを使って、類似したドキュメントのすべてのペアを見つける。",
                    "zh-hans": "高效地找到所有相似文档的配对",
                    "zh-hant": "以時間和記憶體效率找出所有相似文件的配對"
                }
            },
            "https://github.com/daac-tools/crawdad": {
                "sub_category": null,
                "repository_name": "crawdad",
                "user_name": "daac-tools",
                "description": "Rust library of natural language dictionaries using character-wise double-array tries.",
                "multilingual_descriptions": {
                    "en": "Rust library of natural language dictionaries using character-wise double-array tries.",
                    "ja": "文字単位のダブル配列トライを使用した自然言語辞書のRustライブラリ。",
                    "zh-hans": "使用字符级双数组字典树的自然语言词典 Rust 库。",
                    "zh-hant": "使用字符雙陣列嘗試的自然語言字典的 Rust 函式庫。"
                }
            },
            "https://github.com/legalforce-research/tokenizer-speed-bench": {
                "sub_category": null,
                "repository_name": "tokenizer-speed-bench",
                "user_name": "legalforce-research",
                "description": "Comparison code of various tokenizers",
                "multilingual_descriptions": {
                    "en": " Comparison code of various tokenizers",
                    "ja": "様々なトークナイザーの比較コード",
                    "zh-hans": "各种分词器的比较代码",
                    "zh-hant": "各種分詞器的比較代碼"
                }
            },
            "https://github.com/legalforce-research/stringmatch-bench": {
                "sub_category": null,
                "repository_name": "stringmatch-bench",
                "user_name": "legalforce-research",
                "description": "Here provides benchmark tools to compare the performance of data structures for string matching.",
                "multilingual_descriptions": {
                    "en": "Here provides benchmark tools to compare the performance of data structures for string matching.",
                    "ja": "ここでは、文字列マッチングのデータ構造のパフォーマンスを比較するためのベンチマークツールが提供されています。",
                    "zh-hans": "这里提供基准工具来比较字符串匹配数据结构的性能。",
                    "zh-hant": "這裡提供基準工具，用於比較字串匹配的資料結構效能。"
                }
            },
            "https://github.com/algon-320/vime": {
                "sub_category": null,
                "repository_name": "vime",
                "user_name": "algon-320",
                "description": "Using Vim as an input method for X11 apps",
                "multilingual_descriptions": {
                    "en": "Using Vim as an input method for X11 apps",
                    "ja": "X11アプリケーションの入力方法としてVimを使用する",
                    "zh-hans": "使用Vim作为X11应用程序的输入法",
                    "zh-hant": "使用Vim作為X11應用程式的輸入法"
                }
            },
            "https://github.com/VOICEVOX/voicevox_core": {
                "sub_category": null,
                "repository_name": "voicevox_core",
                "user_name": "VOICEVOX",
                "description": "無料で使える中品質なテキスト読み上げソフトウェア、VOICEVOXのコア",
                "multilingual_descriptions": {
                    "en": "The core of VOICEVOX, a medium-quality text-to-speech software that can be used for free.",
                    "ja": "無料で使える中品質なテキスト読み上げソフトウェア、VOICEVOXのコア",
                    "zh-hans": "VOICEVOX的核心是一款中等质量的免费文本朗读软件。",
                    "zh-hant": "免費使用的中等質量的文字朗讀軟件，VOICEVOX的核心"
                }
            },
            "https://github.com/akaza-im/akaza": {
                "sub_category": null,
                "repository_name": "akaza",
                "user_name": "akaza-im",
                "description": "Yet another Japanese IME for IBus/Linux",
                "multilingual_descriptions": {
                    "en": "Yet another Japanese IME for IBus/Linux",
                    "ja": "IBus/Linux用のもう1つの日本語IME",
                    "zh-hans": "又一个适用于IBus/Linux的日语输入法",
                    "zh-hant": "又一個針對IBus/Linux的日文輸入法"
                }
            },
            "https://github.com/WeDontPanic/Jotoba": {
                "sub_category": null,
                "repository_name": "Jotoba",
                "user_name": "WeDontPanic",
                "description": "A free online, self-hostable, multilang Japanese dictionary.",
                "multilingual_descriptions": {
                    "en": "A free online, self-hostable, multilang Japanese dictionary.",
                    "ja": "無料でオンラインで自己ホスト可能な、多言語対応の日本語辞書。",
                    "zh-hans": "一个免费的在线、自托管、多语言的日语词典。",
                    "zh-hant": "一個免費的在線自主托管的多語言日語詞典。"
                }
            },
            "https://github.com/shinespark/dvorakjp-romantable": {
                "sub_category": null,
                "repository_name": "dvorakjp-romantable",
                "user_name": "shinespark",
                "description": "Google 日本語入力用DvorakJPローマ字テーブル / DvorakJP Roman Table for Google Japanese Input",
                "multilingual_descriptions": {
                    "en": "DvorakJP Roman Table for Google Japanese Input",
                    "ja": "Google日本語入力用のDvorakJPローマ字テーブル",
                    "zh-hans": "谷歌日语输入用DvorakJP罗马字表 / DvorakJP罗马字表适用于谷歌日语输入",
                    "zh-hant": "Google 日本語輸入用 DvorakJP 羅馬字表 / DvorakJP Roman Table for Google Japanese Input"
                }
            },
            "https://github.com/Netdex/niinii": {
                "sub_category": null,
                "repository_name": "niinii",
                "user_name": "Netdex",
                "description": "Japanese glossator for assisted reading of text using Ichiran",
                "multilingual_descriptions": {
                    "en": " Japanese glossator for assisted reading of text using Ichiran",
                    "ja": "一覧を使用したテキストの補助読みのための日本語の注釈者",
                    "zh-hans": "使用Ichiran辅助阅读文本的日语注释器",
                    "zh-hant": "使用一個日語注釋器來輔助閱讀文本，使用「一覧」。"
                }
            },
            "https://github.com/naokiri/cskk": {
                "sub_category": null,
                "repository_name": "cskk",
                "user_name": "naokiri",
                "description": "SKK (Simple Kana Kanji henkan) library",
                "multilingual_descriptions": {
                    "en": "SKK (Simple Kana Kanji conversion) library",
                    "ja": "出力: SKK（シンプルかな漢字変換）ライブラリ",
                    "zh-hans": "SKK（简单假名汉字转换）库",
                    "zh-hant": "SKK（簡易假名漢字轉換）程式庫"
                }
            },
            "https://github.com/tysonwu/japanki": {
                "sub_category": null,
                "repository_name": "japanki",
                "user_name": "tysonwu",
                "description": "Learn Japanese vocabs 🇯🇵 by doing quizzes on CLI!",
                "multilingual_descriptions": {
                    "en": "Learn Japanese vocabs 🇯🇵 by doing quizzes on CLI!",
                    "ja": "CLIでクイズをすることで日本語の単語を学びましょう！ 🇯🇵",
                    "zh-hans": "通过在CLI上做测验来学习日语词汇🇯🇵！",
                    "zh-hant": "通過在CLI上進行測驗來學習日語詞彙🇯🇵！"
                }
            },
            "https://github.com/jpreprocess/jpreprocess": {
                "sub_category": null,
                "repository_name": "jpreprocess",
                "user_name": "jpreprocess",
                "description": "Japanese text preprocessor for Text-to-Speech applications (OpenJTalk rewrite in rust language)",
                "multilingual_descriptions": {
                    "en": "Japanese text preprocessor for Text-to-Speech applications (OpenJTalk rewrite in rust language)",
                    "ja": "テキスト読み上げアプリケーション用の日本語テキストプリプロセッサ（Rust言語でのOpenJTalkの書き直し）",
                    "zh-hans": "用于文本转语音应用程序的日语文本预处理器（OpenJTalk在Rust语言中的重写）\n用于文本转语音应用程序的日语文本预处理器（用Rust语言重写的OpenJTalk）",
                    "zh-hant": "用於文本轉語音應用的日文文本預處理器（OpenJTalk在Rust語言中的重寫）"
                }
            },
            "https://github.com/japanese-law-analysis/listup_precedent": {
                "sub_category": null,
                "repository_name": "listup_precedent",
                "user_name": "japanese-law-analysis",
                "description": "裁判例のデータ一覧を裁判所のホームページ(https://www.courts.go.jp/index.html) をスクレイピングして生成するソフトウェア",
                "multilingual_descriptions": {
                    "en": "Software that scrapes and generates a list of case law data from the court's website (https://www.courts.go.jp/index.html)",
                    "ja": "裁判例のデータ一覧を裁判所のホームページ(https://www.courts.go.jp/index.html) をスクレイピングして生成するソフトウェア",
                    "zh-hans": "使用软件从法院网站(https://www.courts.go.jp/index.html) 爬取裁判例数据并生成数据列表。",
                    "zh-hant": "裁判例資料列表生成軟體，可透過網址(https://www.courts.go.jp/index.html) 對法院網站進行爬蟲。"
                }
            },
            "https://github.com/eagleflo/jisho": {
                "sub_category": null,
                "repository_name": "jisho",
                "user_name": "eagleflo",
                "description": "Jisho is a CLI tool & Rust library that provides a Japanese-English dictionary.",
                "multilingual_descriptions": {
                    "en": "Jisho is a CLI tool & Rust library that provides a Japanese-English dictionary.",
                    "ja": "Jishoは、日本語-英語辞書を提供するCLIツールおよびRustライブラリです。\nJishoは、日本語-英語辞書を提供するCLIツール＆Rustライブラリです。",
                    "zh-hans": "Jisho是一个提供日语-英语词典的CLI工具和Rust库。",
                    "zh-hant": "Jisho 是一個提供日英詞典的 CLI 工具和 Rust 函式庫。"
                }
            }
        },
        "JavaScript": {
            "https://github.com/takuyaa/kuromoji.js": {
                "sub_category": "Morphology analysis",
                "repository_name": "kuromoji.js",
                "user_name": "takuyaa",
                "description": "JavaScript implementation of Japanese morphological analyzer",
                "multilingual_descriptions": {
                    "en": "JavaScript implementation of Japanese morphological analyzer",
                    "ja": "日本語形態素解析器のJavaScript実装",
                    "zh-hans": "日语形态分析器的JavaScript实现",
                    "zh-hant": "日本語形態素解析器的JavaScript實現"
                }
            },
            "https://github.com/rakuten-nlp/rakutenma": {
                "sub_category": "Morphology analysis",
                "repository_name": "rakutenma",
                "user_name": "rakuten-nlp",
                "description": "morphological analyzer (word segmentor + PoS Tagger) for Chinese and Japanese written purely in JavaScript.",
                "multilingual_descriptions": {
                    "en": " Rakuten MA - morphological analyzer (word segmentor + PoS Tagger) for Chinese and Japanese written purely in JavaScript.",
                    "ja": "日本語と中国語の形態素解析器（単語分割器+品詞タガー）である「楽天MA」は、純粋にJavaScriptで書かれています。",
                    "zh-hans": "Rakuten MA - 用纯JavaScript编写的中文和日文形态分析器（词分割器+词性标注器）。",
                    "zh-hant": "Rakuten MA - 一款純粹使用 JavaScript 編寫的中日文形態分析器（詞分割器 + 詞性標記器）。"
                }
            },
            "https://github.com/golbin/node-mecab-ya": {
                "sub_category": "Morphology analysis",
                "repository_name": "node-mecab-ya",
                "user_name": "golbin",
                "description": "Yet another mecab wrapper for nodejs",
                "multilingual_descriptions": {
                    "en": "Yet another mecab wrapper for nodejs",
                    "ja": "Nodejs用の別のmecabラッパー",
                    "zh-hans": "又一个用于nodejs的mecab包装器",
                    "zh-hant": "另一個用於 Node.js 的 MeCab 封裝程式"
                }
            },
            "https://github.com/thammin/juman-bin": {
                "sub_category": "Morphology analysis",
                "repository_name": "juman-bin",
                "user_name": "thammin",
                "description": "a User-Extensible Morphological Analyzer for Japanese. 日本語形態素解析システム",
                "multilingual_descriptions": {
                    "en": "a User-Extensible Morphological Analyzer for Japanese. 日本語形態素解析システム",
                    "ja": "日本語形態素解析システムのユーザー拡張可能な解析器。",
                    "zh-hans": "一个用户可扩展的日语形态学分析器。日本语形态学分析系统。",
                    "zh-hant": "一個可擴展的日本語形態素解析器。日本語形態素解析系統。"
                }
            },
            "https://github.com/hecomi/node-mecab-async": {
                "sub_category": "Morphology analysis",
                "repository_name": "node-mecab-async",
                "user_name": "hecomi",
                "description": "Asynchronous japanese morphological analyser using MeCab.",
                "multilingual_descriptions": {
                    "en": "Asynchronous japanese morphological analyser using MeCab.",
                    "ja": "MeCabを使用した非同期日本語形態素解析器。",
                    "zh-hans": "使用MeCab的异步日语形态分析器。",
                    "zh-hant": "使用MeCab的非同步日語形態分析器。"
                }
            },
            "https://github.com/hexenq/kuroshiro": {
                "sub_category": "Converter",
                "repository_name": "kuroshiro",
                "user_name": "hexenq",
                "description": "Japanese language library for converting Japanese sentence to Hiragana, Katakana or Romaji with furigana and okurigana modes supported.",
                "multilingual_descriptions": {
                    "en": "Japanese language library for converting Japanese sentence to Hiragana, Katakana or Romaji with furigana and okurigana modes supported.",
                    "ja": "ふりがなと送り仮名モードに対応した、日本語の文章をひらがな、カタカナ、ローマ字に変換するための日本語言語ライブラリ。",
                    "zh-hans": "日语语言库，可将日语句子转换为平假名、片假名或罗马字，并支持振假名和送假名模式。",
                    "zh-hant": "日語語言庫，可將日語句子轉換為平假名、片假名或羅馬字，支持振り仮名和送り仮名模式。"
                }
            },
            "https://github.com/hexenq/kuroshiro-analyzer-kuromoji": {
                "sub_category": "Converter",
                "repository_name": "kuroshiro-analyzer-kuromoji",
                "user_name": "hexenq",
                "description": "Kuromoji morphological analyzer for kuroshiro.",
                "multilingual_descriptions": {
                    "en": "Kuromoji morphological analyzer for kuroshiro.",
                    "ja": "黒白のためのKuromoji形態素解析器。",
                    "zh-hans": "Kuroshiro 的 Kuromoji 形态分析器。",
                    "zh-hant": "Kuroshiro 的 Kuromoji 形態分析器。"
                }
            },
            "https://github.com/lovell/hepburn": {
                "sub_category": "Converter",
                "repository_name": "hepburn",
                "user_name": "lovell",
                "description": "Node.js module for converting Japanese Hiragana and Katakana script to, and from, Romaji using Hepburn romanisation",
                "multilingual_descriptions": {
                    "en": "Node.js module for converting Japanese Hiragana and Katakana script to, and from, Romaji using Hepburn romanisation",
                    "ja": "ヘボン式ローマ字による、日本語のひらがなとカタカナを相互に変換するためのNode.jsモジュール",
                    "zh-hans": "使用Hepburn罗马化将日语平假名和片假名转换为罗马字的Node.js模块。",
                    "zh-hant": "使用 Hepburn 羅馬拼音將日文平假名和片假名轉換為羅馬字的 Node.js 模組。"
                }
            },
            "https://github.com/twada/japanese-numerals-to-number": {
                "sub_category": "Converter",
                "repository_name": "japanese-numerals-to-number",
                "user_name": "twada",
                "description": "Converts Japanese Numerals into number",
                "multilingual_descriptions": {
                    "en": "Converts Japanese Numerals into number",
                    "ja": "日本の数字を数字に変換します。",
                    "zh-hans": "将日语数字转换为阿拉伯数字",
                    "zh-hant": "將日本數字轉換為數字"
                }
            },
            "https://github.com/kariminf/jslingua": {
                "sub_category": "Converter",
                "repository_name": "jslingua",
                "user_name": "kariminf",
                "description": "Javascript libraries to process text: Arabic, Japanese, etc.",
                "multilingual_descriptions": {
                    "en": "Javascript libraries for text processing: Arabic, Japanese, and more.",
                    "ja": "テキストを処理するためのJavascriptライブラリ：アラビア語、日本語など。",
                    "zh-hans": "处理文本的Javascript库：阿拉伯语、日语等。",
                    "zh-hant": "處理文本的Javascript庫：阿拉伯語，日語等。"
                }
            },
            "https://github.com/WaniKani/WanaKana": {
                "sub_category": "Converter",
                "repository_name": "WanaKana",
                "user_name": "WaniKani",
                "description": "Javascript library for detecting and transliterating Hiragana <--> Katakana <--> Romaji",
                "multilingual_descriptions": {
                    "en": "A Javascript library that can detect and transliterate between Hiragana, Katakana, and Romaji.",
                    "ja": "ひらがな<-->カタカナ<-->ローマ字の検出と転写のためのJavascriptライブラリ",
                    "zh-hans": "用于检测和转换平假名<-->片假名<-->罗马字的Javascript库",
                    "zh-hant": "JavaScript 庫，用於檢測和轉寫平假名 <--> 片假名 <--> 羅馬字。"
                }
            },
            "https://github.com/jeresig/node-romaji-name": {
                "sub_category": "Converter",
                "repository_name": "node-romaji-name",
                "user_name": "jeresig",
                "description": "Normalize and fix common issues with Romaji-based Japanese names.",
                "multilingual_descriptions": {
                    "en": "Normalize and fix common issues with Romaji-based Japanese names.",
                    "ja": "ローマ字表記の日本人名における一般的な問題を正規化し修正する。",
                    "zh-hans": "规范和修复基于罗马字的日本姓名中常见的问题。",
                    "zh-hant": "將基於羅馬字的日本名字進行標準化和修復常見問題。"
                }
            },
            "https://github.com/hakatashi/kyujitai.js": {
                "sub_category": "Converter",
                "repository_name": "kyujitai.js",
                "user_name": "hakatashi",
                "description": "Utility collections for making Japanese text old-fashioned",
                "multilingual_descriptions": {
                    "en": "Utility collections for making Japanese text old-fashioned",
                    "ja": "日本語のテキストを古風にするためのユーティリティコレクション",
                    "zh-hans": "用于使日文文本老式化的实用集合",
                    "zh-hant": "製作日本古風文本的實用集合"
                }
            },
            "https://github.com/geolonia/normalize-japanese-addresses": {
                "sub_category": "Converter",
                "repository_name": "normalize-japanese-addresses",
                "user_name": "geolonia",
                "description": "オープンソースの住所正規化ライブラリ。",
                "multilingual_descriptions": {
                    "en": "Open source address normalization library.",
                    "ja": "オープンソースの住所正規化ライブラリ。",
                    "zh-hans": "开源地址规范化库。",
                    "zh-hant": "開源的地址規範化程式庫。"
                }
            },
            "https://github.com/kazuhikoarase/jaconv": {
                "sub_category": "Converter",
                "repository_name": "jaconv",
                "user_name": "kazuhikoarase",
                "description": "日本語文字変換ライブラリ (javascript)",
                "multilingual_descriptions": {
                    "en": "Japanese text conversion library (javascript)",
                    "ja": "日本語文字変換ライブラリ (javascript)",
                    "zh-hans": "日本语文字转换库（javascript）",
                    "zh-hant": "日本語文字轉換程式庫 (javascript)"
                }
            },
            "https://github.com/koozaki/romaji-conv": {
                "sub_category": "Converter",
                "repository_name": "romaji-conv",
                "user_name": "koozaki",
                "description": "Convert romaji into hiragana",
                "multilingual_descriptions": {
                    "en": "Convert romaji into hiragana",
                    "ja": "ローマ字をひらがなに変換する",
                    "zh-hans": "将罗马字转换为平假名",
                    "zh-hant": "將羅馬字轉換為平假名"
                }
            },
            "https://github.com/geolonia/japanese-addresses-v2": {
                "sub_category": "Converter",
                "repository_name": "japanese-addresses-v2",
                "user_name": "geolonia",
                "description": "全国の住所データAPI",
                "multilingual_descriptions": {
                    "en": "National address data API",
                    "ja": "全国の住所データAPI",
                    "zh-hans": "全国住址数据API",
                    "zh-hant": "全國的地址數據API"
                }
            },
            "https://github.com/elzup/jptext-to-emoji": {
                "sub_category": "Converter",
                "repository_name": "jptext-to-emoji",
                "user_name": "elzup",
                "description": "テキストの単語を絵文字に変換する",
                "multilingual_descriptions": {
                    "en": "Convert text words to emojis",
                    "ja": "テキストの単語を絵文字に変換する",
                    "zh-hans": "将文本单词转换为表情符号",
                    "zh-hant": "將文字單詞轉換為表情符號"
                }
            },
            "https://github.com/bangumi-data/bangumi-data": {
                "sub_category": null,
                "repository_name": "bangumi-data",
                "user_name": "bangumi-data",
                "description": "Raw data for Japanese Anime",
                "multilingual_descriptions": {
                    "en": "生データーの日本のアニメについて",
                    "ja": "日本のアニメの生データ",
                    "zh-hans": "日本动漫的原始数据",
                    "zh-hant": "日本動畫的原始數據"
                }
            },
            "https://github.com/FooSoft/yomichan": {
                "sub_category": null,
                "repository_name": "yomichan",
                "user_name": "FooSoft",
                "description": "Japanese pop-up dictionary extension for Chrome and Firefox.",
                "multilingual_descriptions": {
                    "en": "Japanese pop-up dictionary extension for Chrome and Firefox.",
                    "ja": "ChromeとFirefox用の日本語ポップアップ辞書拡張機能。",
                    "zh-hans": "Chrome和Firefox的日语弹出式词典扩展。",
                    "zh-hant": "Chrome和Firefox的日語彈出詞典擴展。"
                }
            },
            "https://github.com/gecko655/proofreading-tool": {
                "sub_category": null,
                "repository_name": "proofreading-tool",
                "user_name": "gecko655",
                "description": "GUIで動作する文書校正ツール GUI tool for textlinting.",
                "multilingual_descriptions": {
                    "en": "GUIで動作する文書校正ツール GUI tool for textlinting.",
                    "ja": "テキストリントツールのGUIツール",
                    "zh-hans": "GUI工具，用于文本校对。",
                    "zh-hant": "GUI工具，用於文本校對。"
                }
            },
            "https://github.com/minosvasilias/kanjigrid": {
                "sub_category": null,
                "repository_name": "kanjigrid",
                "user_name": "minosvasilias",
                "description": "A web-app displaying the 2200 kanji characters taught in James Heisig's \"Remembering the Kanji\", 6th edition.",
                "multilingual_descriptions": {
                    "en": "A web-app displaying the 2200 kanji characters taught in James Heisig's \"Remembering the Kanji\", 6th edition.",
                    "ja": "「Remembering the Kanji」第6版で教えられる2200の漢字を表示するウェブアプリ。",
                    "zh-hans": "一个网页应用程序，展示了《记忆汉字》第六版中教授的2200个汉字。",
                    "zh-hant": "一個網頁應用程式，顯示詹姆斯·海西格《漢字憶起》第六版所教授的2200個漢字。"
                }
            },
            "https://github.com/echamudi/japanese-toolkit": {
                "sub_category": null,
                "repository_name": "japanese-toolkit",
                "user_name": "echamudi",
                "description": "Monorepo for Kanji, Furigana, Japanese DB, and others",
                "multilingual_descriptions": {
                    "en": "Monorepo for Kanji, Furigana, Japanese DB, and others",
                    "ja": "漢字、ふりがな、日本語DBなどのためのモノレポ",
                    "zh-hans": "单一代码库用于汉字、假名、日语数据库等其他内容。",
                    "zh-hant": "單一存儲庫用於漢字、假名、日語數據庫等。"
                }
            },
            "https://github.com/textlint-ja/analyze-desumasu-dearu": {
                "sub_category": null,
                "repository_name": "analyze-desumasu-dearu",
                "user_name": "textlint-ja",
                "description": "文の敬体(ですます調)、常体(である調)を解析するJavaScriptライブラリ",
                "multilingual_descriptions": {
                    "en": "A JavaScript library for analyzing polite language (desu-masu style) and plain language (da-aru style) in sentences.",
                    "ja": "文の敬体(ですます調)、常体(である調)を解析するJavaScriptライブラリ",
                    "zh-hans": "解析敬体（ですます语气）和常体（である语气）的JavaScript库。",
                    "zh-hant": "解析敬體（敬語）和常體（平語）的JavaScript程式庫"
                }
            },
            "https://github.com/DJTB/hatsuon": {
                "sub_category": null,
                "repository_name": "hatsuon",
                "user_name": "DJTB",
                "description": "Japanese pitch accent utils",
                "multilingual_descriptions": {
                    "en": "Japanese pitch accent utils",
                    "ja": "日本語のアクセントユーティリティ",
                    "zh-hans": "日语声调工具",
                    "zh-hant": "日語音高工具"
                }
            },
            "https://github.com/otodn/sentiment_ja_js": {
                "sub_category": null,
                "repository_name": "sentiment_ja_js",
                "user_name": "otodn",
                "description": "Sentiment Analysis in Japanese. sentiment_ja with JavaScript",
                "multilingual_descriptions": {
                    "en": "Sentiment Analysis in Japanese. sentiment_ja with JavaScript",
                    "ja": "日本語の感情分析。JavaScriptでsentiment_ja。",
                    "zh-hans": "使用JavaScript进行日语情感分析，使用sentiment_ja。",
                    "zh-hant": "使用JavaScript進行日語情感分析，sentiment_ja。"
                }
            },
            "https://github.com/takuyaa/mecab-ipadic-seed": {
                "sub_category": null,
                "repository_name": "mecab-ipadic-seed",
                "user_name": "takuyaa",
                "description": "mecab-ipadic seed dictionary reader",
                "multilingual_descriptions": {
                    "en": "mecab-ipadic seed dictionary reader",
                    "ja": "mecab-ipadicのシード辞書リーダー",
                    "zh-hans": "mecab-ipadic 种子词典阅读器",
                    "zh-hant": "mecab-ipadic種子詞典閱讀器"
                }
            },
            "https://github.com/LuanRT/Japanese-Word-Of-The-Day": {
                "sub_category": null,
                "repository_name": "Japanese-Word-Of-The-Day",
                "user_name": "LuanRT",
                "description": "Well, a different Japanese word everyday.",
                "multilingual_descriptions": {
                    "en": "Well, a different Japanese word everyday.",
                    "ja": "毎日違う日本語の単語。",
                    "zh-hans": "每天一个不同的日语单词。",
                    "zh-hant": "每天一個不同的日語單詞。"
                }
            },
            "https://github.com/esrille/oskim": {
                "sub_category": null,
                "repository_name": "oskim",
                "user_name": "esrille",
                "description": "Extend GNOME On-Screen Keyboard for Input Methods",
                "multilingual_descriptions": {
                    "en": "Extend GNOME On-Screen Keyboard for Input Methods",
                    "ja": "入力方法のためにGNOMEオンスクリーンキーボードを拡張する",
                    "zh-hans": "扩展GNOME屏幕键盘以支持输入法",
                    "zh-hant": "擴展 GNOME 螢幕鍵盤以支援輸入法"
                }
            },
            "https://github.com/wtnv-lab/tweetMapping": {
                "sub_category": null,
                "repository_name": "tweetMapping",
                "user_name": "wtnv-lab",
                "description": "東日本大震災発生から24時間以内につぶやかれたジオタグ付きツイートのデジタルアーカイブです。",
                "multilingual_descriptions": {
                    "en": "This is a digital archive of geotagged tweets that were tweeted within 24 hours of the occurrence of the Great East Japan Earthquake.",
                    "ja": "東日本大震災発生から24時間以内につぶやかれたジオタグ付きツイートのデジタルアーカイブです。",
                    "zh-hans": "这是一个带有地理标签的推文数字档案，记录了发生在东日本大地震后24小时内发布的推文。",
                    "zh-hant": "這是東日本大地震發生後24小時內帶有地理標籤的推文的數字檔案。"
                }
            },
            "https://github.com/shirakaba/pitch-accent": {
                "sub_category": null,
                "repository_name": "pitch-accent",
                "user_name": "shirakaba",
                "description": "Predict pitch accent in Japanese",
                "multilingual_descriptions": {
                    "en": "Predict pitch accent in Japanese",
                    "ja": "日本語のアクセントを予測する",
                    "zh-hans": "预测日语的声调重音",
                    "zh-hant": "預測日語的音高重音"
                }
            },
            "https://github.com/amanoese/kana2ipa": {
                "sub_category": null,
                "repository_name": "kana2ipa",
                "user_name": "amanoese",
                "description": "「ひらがな」または「カタカナ」を日本語で発音する際の音声記号(IPA)に変換するコマンド",
                "multilingual_descriptions": {
                    "en": "Command to convert \"hiragana\" or \"katakana\" into International Phonetic Alphabet (IPA) symbols when pronouncing in Japanese.",
                    "ja": "「ひらがな」または「カタカナ」を日本語で発音する際の音声記号(IPA)に変換するコマンド",
                    "zh-hans": "将「ひらがな」或「カタカナ」转换为日语发音时的音标(IPA)的命令。",
                    "zh-hant": "將「ひらがな」或「カタカナ」轉換為日語發音時的音標(IPA)的指令"
                }
            },
            "https://github.com/VOICEVOX/voicevox": {
                "sub_category": null,
                "repository_name": "voicevox",
                "user_name": "VOICEVOX",
                "description": "無料で使える中品質なテキスト読み上げソフトウェア、VOICEVOXのエディター",
                "multilingual_descriptions": {
                    "en": "Editor for VOICEVOX, a medium-quality text-to-speech software that can be used for free.",
                    "ja": "無料で使える中品質なテキスト読み上げソフトウェア、VOICEVOXのエディター",
                    "zh-hans": "免费使用的中等质量的文本朗读软件，VOICEVOX的编辑器",
                    "zh-hant": "免費使用的中等品質文字朗讀軟體，VOICEVOX的編輯器"
                }
            },
            "https://github.com/fasiha/kamiya-codec": {
                "sub_category": null,
                "repository_name": "kamiya-codec",
                "user_name": "fasiha",
                "description": "Towards a Japanese verb conjugator and deconjugator based on Taeko Kamiya's *The Handbook of Japanese Verbs* and *The Handbook of Japanese Adjectives and Adverbs* opuses.",
                "multilingual_descriptions": {
                    "en": "Towards a Japanese verb conjugator and deconjugator based on Taeko Kamiya's *The Handbook of Japanese Verbs* and *The Handbook of Japanese Adjectives and Adverbs* opuses.",
                    "ja": "神谷妙子著『The Handbook of Japanese Verbs』および『The Handbook of Japanese Adjectives and Adverbs』に基づく、日本語動詞の活用・活用解除ツールを目指して。",
                    "zh-hans": "基于神谷多恵子的《日本动词手册》和《日本形容词和副词手册》，开发一个日语动词变位器和去变位器。",
                    "zh-hant": "根據神谷多恵子的《日本動詞手冊》和《日本形容詞和副詞手冊》，開發一個日語動詞變化器和去變化器。"
                }
            }
        },
        "Go": {
            "https://github.com/ikawaha/kagome": {
                "sub_category": "Morphology analysis",
                "repository_name": "kagome",
                "user_name": "ikawaha",
                "description": "Self-contained Japanese Morphological Analyzer written in pure Go",
                "multilingual_descriptions": {
                    "en": "Self-contained Japanese Morphological Analyzer written in pure Go",
                    "ja": "純粋なGoで書かれた自己完結型の日本語形態素解析器",
                    "zh-hans": "用纯Go编写的自包含日语形态分析器",
                    "zh-hant": "純Go編寫的自包含日語形態分析器"
                }
            },
            "https://github.com/jiro4989/ojosama": {
                "sub_category": null,
                "repository_name": "ojosama",
                "user_name": "jiro4989",
                "description": "テキストを壱百満天原サロメお嬢様風の口調に変換します",
                "multilingual_descriptions": {
                    "en": "Converts text into the ojou-sama (refined young lady) speaking style of Hyakumantenbara Salome.",
                    "ja": "テキストを壱百満天原サロメお嬢様風の口調に変換します",
                    "zh-hans": "将文本转换为百万天原萨洛梅小姐风格的口吻。",
                    "zh-hant": "將文字轉換為百滿天原薩洛美小姐風格的口吻。"
                }
            },
            "https://github.com/gojp/nihongo": {
                "sub_category": null,
                "repository_name": "nihongo",
                "user_name": "gojp",
                "description": "Japanese Dictionary",
                "multilingual_descriptions": {
                    "en": "Japanese Dictionary",
                    "ja": "日本語辞書",
                    "zh-hans": "日语词典",
                    "zh-hant": "日本語詞典"
                }
            },
            "https://github.com/FooSoft/yomichan-import": {
                "sub_category": null,
                "repository_name": "yomichan-import",
                "user_name": "FooSoft",
                "description": "External dictionary importer for Yomichan.",
                "multilingual_descriptions": {
                    "en": "External dictionary importer for Yomichan.",
                    "ja": "Yomichan用の外部辞書インポーター。",
                    "zh-hans": "Yomichan的外部词典导入器。",
                    "zh-hant": "Yomichan 的外部詞典導入工具。"
                }
            },
            "https://github.com/maruamyu/imas-ime-dic": {
                "sub_category": null,
                "repository_name": "imas-ime-dic",
                "user_name": "maruamyu",
                "description": "THE IDOLM@STER words dictionary for Japanese IME (by imas-db.jp)",
                "multilingual_descriptions": {
                    "en": "THE IDOLM@STER words dictionary for Japanese IME (by imas-db.jp)",
                    "ja": "アイドルマスターの言葉辞書（imas-db.jpによる日本語IME用）",
                    "zh-hans": "《偶像大师》日语输入法词典（由imas-db.jp提供）",
                    "zh-hant": "THE IDOLM@STER 日文輸入法詞彙表（由imas-db.jp提供）"
                }
            },
            "https://github.com/sarumaj/go-kakasi": {
                "sub_category": null,
                "repository_name": "go-kakasi",
                "user_name": "sarumaj",
                "description": "Kanji transliteration to hiragana/katakana/romaji, in Go",
                "multilingual_descriptions": {
                    "en": "Kanji transliteration to hiragana/katakana/romaji, in Go",
                    "ja": "Goによる漢字のひらがな/カタカナ/ローマ字への変換",
                    "zh-hans": "用Go语言将汉字音译为平假名/片假名/罗马字",
                    "zh-hant": "在Go中將漢字音譯為平假名/片假名/羅馬字"
                }
            },
            "https://github.com/ktnyt/go-moji": {
                "sub_category": null,
                "repository_name": "go-moji",
                "user_name": "ktnyt",
                "description": "A Go library for Zenkaku/Hankaku conversion",
                "multilingual_descriptions": {
                    "en": "A Go library for Zenkaku/Hankaku conversion",
                    "ja": "全角/半角変換のためのGoライブラリ",
                    "zh-hans": "一个用于全角/半角转换的Go库",
                    "zh-hant": "一個用於全角/半角轉換的 Go 函式庫"
                }
            },
            "https://github.com/greymd/ojichat": {
                "sub_category": null,
                "repository_name": "ojichat",
                "user_name": "greymd",
                "description": "おじさんがLINEやメールで送ってきそうな文を生成する",
                "multilingual_descriptions": {
                    "en": "Generate sentences that an uncle would send via LINE or email.",
                    "ja": "おじさんがLINEやメールで送ってきそうな文を生成する",
                    "zh-hans": "生成一个似乎是叔叔通过LINE或邮件发送的句子。",
                    "zh-hant": "生成一些看起來像叔叔會透過LINE或郵件發送的文字"
                }
            },
            "https://github.com/kuniwak/name": {
                "sub_category": null,
                "repository_name": "name",
                "user_name": "kuniwak",
                "description": "Name Searcher in Japanese",
                "multilingual_descriptions": {
                    "en": "Name Searcher in Japanese",
                    "ja": "日本語の名前検索者",
                    "zh-hans": "日语姓名搜索器",
                    "zh-hant": "日本名稱搜索器"
                }
            }
        },
        "Java": {
            "https://github.com/atilika/kuromoji": {
                "sub_category": "Morphology analysis",
                "repository_name": "kuromoji",
                "user_name": "atilika",
                "description": "Kuromoji is a self-contained and very easy to use Japanese morphological analyzer designed for search",
                "multilingual_descriptions": {
                    "en": "Kuromoji is a self-contained and very easy to use Japanese morphological analyzer designed for search",
                    "ja": "Kuromojiは、検索用に設計された自己完結型で非常に使いやすい日本語形態素解析器です。",
                    "zh-hans": "Kuromoji是一个自包含且非常易于使用的日语形态分析器，专为搜索而设计。",
                    "zh-hant": "Kuromoji是一個自包含且非常易於使用的日語形態分析器，專為搜索而設計。"
                }
            },
            "https://github.com/WorksApplications/SudachiDict": {
                "sub_category": "Morphology analysis",
                "repository_name": "SudachiDict",
                "user_name": "WorksApplications",
                "description": "A lexicon for Sudachi",
                "multilingual_descriptions": {
                    "en": "A lexicon for Sudachi",
                    "ja": "Sudachi用の辞書",
                    "zh-hans": "一个Sudachi词汇表",
                    "zh-hant": "Sudachi詞彙表"
                }
            },
            "https://github.com/teru-oka-1933/meval": {
                "sub_category": "Morphology analysis",
                "repository_name": "meval",
                "user_name": "teru-oka-1933",
                "description": "形態素解析器性能評価システム MevAL",
                "multilingual_descriptions": {
                    "en": "Morphological analyzer performance evaluation system MevAL",
                    "ja": "形態素解析器性能評価システム MevAL",
                    "zh-hans": "形态素解析器性能评估系统 MevAL",
                    "zh-hant": "形態素解析器性能評估系統 MevAL"
                }
            },
            "https://github.com/sakarika/kanjitomo-ocr": {
                "sub_category": null,
                "repository_name": "kanjitomo-ocr",
                "user_name": "sakarika",
                "description": "Java library for identifying Japanese characters from images",
                "multilingual_descriptions": {
                    "en": "Java library for identifying Japanese characters from images",
                    "ja": "画像から日本語文字を識別するためのJavaライブラリ",
                    "zh-hans": "用于从图像中识别日语字符的Java库",
                    "zh-hant": "從圖像中識別日文字符的Java庫"
                }
            },
            "https://github.com/nicolas-raoul/jakaroma": {
                "sub_category": null,
                "repository_name": "jakaroma",
                "user_name": "nicolas-raoul",
                "description": "Java library and command-line tool to transliterate Japanese kanji to romaji (Latin alphabet)",
                "multilingual_descriptions": {
                    "en": "Java library and command-line tool to transliterate Japanese kanji to romaji (Latin alphabet)",
                    "ja": "日本語の漢字をローマ字（ラテンアルファベット）に変換するためのJavaライブラリとコマンドラインツール。",
                    "zh-hans": "将日语汉字转换为罗马字（拉丁字母）的Java库和命令行工具。",
                    "zh-hant": "將日本漢字轉換為羅馬字（拉丁字母）的Java庫和命令行工具"
                }
            },
            "https://github.com/nicolas-raoul/kakasi-java": {
                "sub_category": null,
                "repository_name": "kakasi-java",
                "user_name": "nicolas-raoul",
                "description": "Kanji transliteration to hiragana/katakana/romaji, in Java",
                "multilingual_descriptions": {
                    "en": "Kanji transliteration to hiragana/katakana/romaji, in Java",
                    "ja": "Javaにおける漢字のひらがな/カタカナ/ローマ字への転写",
                    "zh-hans": "Java中的汉字音译为平假名/片假名/罗马字。",
                    "zh-hant": "Java中的漢字音譯為平假名/片假名/羅馬字"
                }
            },
            "https://github.com/fauu/Kamite": {
                "sub_category": null,
                "repository_name": "Kamite",
                "user_name": "fauu",
                "description": "A desktop language immersion companion for learners of Japanese",
                "multilingual_descriptions": {
                    "en": "A desktop language immersion companion for learners of Japanese",
                    "ja": "日本語学習者のためのデスクトップ言語浸透コンパニオン",
                    "zh-hans": "一款桌面语言沉浸式伴侣，适用于学习日语的学习者。",
                    "zh-hant": "一款桌面式的日語學習輔助工具"
                }
            },
            "https://github.com/craftzdog/react-native-japanese-tokenizer": {
                "sub_category": null,
                "repository_name": "react-native-japanese-tokenizer",
                "user_name": "craftzdog",
                "description": "Async Japanese Tokenizer Native Plugin for React Native for iOS and Android",
                "multilingual_descriptions": {
                    "en": "Async Japanese Tokenizer Native Plugin for React Native for iOS and Android",
                    "ja": "React Native用の非同期日本語トークナイザーネイティブプラグイン（iOSおよびAndroid用）",
                    "zh-hans": "React Native异步日语分词原生插件，适用于iOS和Android。",
                    "zh-hant": "React Native 的非同步日本語分詞原生插件，適用於 iOS 和 Android。"
                }
            },
            "https://github.com/suguru/elasticsearch-analysis-japanese": {
                "sub_category": null,
                "repository_name": "elasticsearch-analysis-japanese",
                "user_name": "suguru",
                "description": "Japanese analyzer uses kuromoji japanese tokenizer for ElasticSearch",
                "multilingual_descriptions": {
                    "en": "The Japanese analyzer utilizes the Kuromoji Japanese tokenizer for ElasticSearch.",
                    "ja": "日本語アナライザーは、ElasticSearch用にkuromoji日本語トークナイザーを使用しています。",
                    "zh-hans": "面向ElasticSearch的日语分析器，使用kuromoji日语分词器。",
                    "zh-hant": "適用於ElasticSearch的日語分析器，使用kuromoji日語分詞器。"
                }
            },
            "https://github.com/andree-surya/moji4j": {
                "sub_category": null,
                "repository_name": "moji4j",
                "user_name": "andree-surya",
                "description": "A Java library to converts between Japanese Hiragana, Katakana, and Romaji scripts.",
                "multilingual_descriptions": {
                    "en": "A Java library to converts between Japanese Hiragana, Katakana, and Romaji scripts.",
                    "ja": "日本語のひらがな、カタカナ、ローマ字のスクリプト間を変換するためのJavaライブラリ。",
                    "zh-hans": "一个Java库，用于在日语平假名、片假名和罗马字之间进行转换。",
                    "zh-hant": "一個Java庫，可在日文平假名、片假名和羅馬字之間進行轉換。"
                }
            },
            "https://github.com/ikegami-yukino/neologdn-java": {
                "sub_category": null,
                "repository_name": "neologdn-java",
                "user_name": "ikegami-yukino",
                "description": "Japanese text normalizer for mecab-neologd",
                "multilingual_descriptions": {
                    "en": "Japanese text normalizer for mecab-neologd",
                    "ja": "mecab-neologd用の日本語テキスト正規化ツール",
                    "zh-hans": "针对mecab-neologd的日语文本规范化工具",
                    "zh-hant": "mecab-neologd 的日文文本正規化工具"
                }
            },
            "https://github.com/worksapplications/elasticsearch-sudachi": {
                "sub_category": null,
                "repository_name": "elasticsearch-sudachi",
                "user_name": "worksapplications",
                "description": "The Japanese analysis plugin for elasticsearch",
                "multilingual_descriptions": {
                    "en": "The Japanese analysis plugin for elasticsearch",
                    "ja": "Elasticsearchのための日本語解析プラグイン",
                    "zh-hans": "用于Elasticsearch的日语分析插件",
                    "zh-hant": "用於Elasticsearch的日語分析插件"
                }
            }
        },
        "Pretrained model": {
            "https://github.com/philipperemy/japanese-words-to-vectors": {
                "sub_category": "Word2Vec",
                "repository_name": "japanese-words-to-vectors",
                "user_name": "philipperemy",
                "description": "Word2vec (word to vectors) approach for Japanese language using Gensim and Mecab.",
                "multilingual_descriptions": {
                    "en": "Word2vec (word to vectors) approach for Japanese language using Gensim and Mecab.",
                    "ja": "GensimとMecabを使用した日本語のWord2vec（単語からベクトルへのアプローチ）手法。",
                    "zh-hans": "使用Gensim和Mecab的Word2vec（单词到向量）方法来处理日语。",
                    "zh-hant": "使用Gensim和Mecab的日語Word2vec（單詞到向量）方法。"
                }
            },
            "https://github.com/WorksApplications/chiVe": {
                "sub_category": "Word2Vec",
                "repository_name": "chiVe",
                "user_name": "WorksApplications",
                "description": "Japanese word embedding with Sudachi and NWJC",
                "multilingual_descriptions": {
                    "en": "Japanese word embedding with Sudachi and NWJC",
                    "ja": "SudachiとNWJCを使用した日本語の単語埋め込み。",
                    "zh-hans": "使用Sudachi和NWJC的日语词嵌入",
                    "zh-hant": "使用Sudachi和NWJC的日語詞嵌入"
                }
            },
            "https://github.com/cl-tohoku/elmo-japanese": {
                "sub_category": "Word2Vec",
                "repository_name": "elmo-japanese",
                "user_name": "cl-tohoku",
                "description": "elmo-japanese",
                "multilingual_descriptions": {
                    "en": "Elmo (in Japanese)",
                    "ja": "エルモ-日本語",
                    "zh-hans": "艾尔莫-日语",
                    "zh-hant": "艾摩日文"
                }
            },
            "https://github.com/yagays/embedrank": {
                "sub_category": "Word2Vec",
                "repository_name": "embedrank",
                "user_name": "yagays",
                "description": "Python Implementation of EmbedRank",
                "multilingual_descriptions": {
                    "en": "Python Implementation of EmbedRank",
                    "ja": "EmbedRankのPython実装",
                    "zh-hans": "EmbedRank的Python实现",
                    "zh-hant": "EmbedRank 的 Python 實現"
                }
            },
            "https://github.com/eggplants/aovec": {
                "sub_category": "Word2Vec",
                "repository_name": "aovec",
                "user_name": "eggplants",
                "description": "青空文庫全書籍のWord2Vecビルダー+構築済みモデル",
                "multilingual_descriptions": {
                    "en": "Easy aozorabunko Word2Vec Builder - Word2Vec Builder and pre-built model for all books in the Aozora Bunko library.",
                    "ja": "簡単な青空文庫のWord2Vecビルダー - 青空文庫の全書籍を対象としたWord2Vecモデルの構築と構築済みモデル",
                    "zh-hans": "易用的青空文库Word2Vec构建器 - 包含所有书籍的Word2Vec构建器和预先构建的模型。",
                    "zh-hant": "簡易青空文庫Word2Vec建構器 - 青空文庫全書籍的Word2Vec建構器+已建構模型"
                }
            },
            "https://github.com/lapras-inc/dependency-based-japanese-word-embeddings": {
                "sub_category": "Word2Vec",
                "repository_name": "dependency-based-japanese-word-embeddings",
                "user_name": "lapras-inc",
                "description": "This is a repository for the AI LAB article \"係り受けに基づく日本語単語埋込 (Dependency-based Japanese Word Embeddings)\" ( Article URL https://ai-lab.lapras.com/nlp/japanese-word-embedding/)",
                "multilingual_descriptions": {
                    "en": "This is a repository for the AI LAB article \"係り受けに基づく日本語単語埋込 (Dependency-based Japanese Word Embeddings)\" ( Article URL https://ai-lab.lapras.com/nlp/japanese-word-embedding/)",
                    "ja": "これはAI LABの記事「係り受けに基づく日本語単語埋込 (Dependency-based Japanese Word Embeddings)」のリポジトリです。（記事URL https://ai-lab.lapras.com/nlp/japanese-word-embedding/）",
                    "zh-hans": "这是AI LAB文章“係り受けに基づく日本語単語埋込（基于依存关系的日语词嵌入）”的存储库（文章网址https://ai-lab.lapras.com/nlp/japanese-word-embedding/）。",
                    "zh-hant": "這是 AI LAB 文章「係り受けに基づく日本語単語埋込 (Dependency-based Japanese Word Embeddings)」的儲存庫 (文章網址 https://ai-lab.lapras.com/nlp/japanese-word-embedding/)。"
                }
            },
            "https://github.com/wikiwikification/jawikivec": {
                "sub_category": "Word2Vec",
                "repository_name": "jawikivec",
                "user_name": "wikiwikification",
                "description": "Yet Another Japanese-Wikipedia Entity Vectors",
                "multilingual_descriptions": {
                    "en": "Yet Another Japanese-Wikipedia Entity Vectors",
                    "ja": "もう一つの日本語ウィキペディアエンティティベクトル",
                    "zh-hans": "又一个日语维基百科实体向量",
                    "zh-hant": "另一個日本維基百科實體向量"
                }
            },
            "https://github.com/kamigaito/jawiki_word_vector_updater": {
                "sub_category": "Word2Vec",
                "repository_name": "jawiki_word_vector_updater",
                "user_name": "kamigaito",
                "description": "最新の日本語Wikipediaのダンプデータから，MeCabを用いてIPA辞書と最新のNeologd辞書の両方で形態素解析を実施し，その結果に基づいた word2vec，fastText，GloVeの単語分散表現を学習するためのスクリプト",
                "multilingual_descriptions": {
                    "en": "A script for learning word embedding models such as word2vec, fastText, and GloVe based on the results of morphological analysis using both the IPA dictionary and the latest Neologd dictionary, using MeCab on the latest Japanese Wikipedia dump data.",
                    "ja": "最新の日本語Wikipediaのダンプデータから，MeCabを用いてIPA辞書と最新のNeologd辞書の両方で形態素解析を実施し，その結果に基づいた word2vec，fastText，GloVeの単語分散表現を学習するためのスクリプト",
                    "zh-hans": "使用最新的日本语Wikipedia转储数据，使用MeCab在IPA词典和最新的Neologd词典中进行形态分析，并基于其结果学习word2vec、fastText和GloVe的词向量表示的脚本。",
                    "zh-hant": "從最新的日本語Wikipedia傾印數據中，使用MeCab在IPA詞典和最新的Neologd詞典中進行形態素分析，並基於該結果學習word2vec、fastText和GloVe的詞向量表示的腳本。"
                }
            },
            "https://github.com/cl-tohoku/bert-japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "bert-japanese",
                "user_name": "cl-tohoku",
                "description": "BERT models for Japanese text.",
                "multilingual_descriptions": {
                    "en": "BERT models for Japanese language text.",
                    "ja": "日本語テキスト用のBERTモデル。",
                    "zh-hans": "用于日语文本的BERT模型。",
                    "zh-hant": "日文文本的BERT模型。"
                }
            },
            "https://github.com/rinnakk/japanese-pretrained-models": {
                "sub_category": "Transformer based models",
                "repository_name": "japanese-pretrained-models",
                "user_name": "rinnakk",
                "description": "Code for producing Japanese pretrained models provided by rinna Co., Ltd.",
                "multilingual_descriptions": {
                    "en": "Code for producing Japanese pretrained models provided by rinna Co., Ltd.",
                    "ja": "rinna株式会社が提供する日本語事前学習モデルを作成するためのコード。",
                    "zh-hans": "rinna有限公司提供的生成日语预训练模型的代码。",
                    "zh-hant": "由rinna株式會社提供的生成日語預訓練模型的代碼。"
                }
            },
            "https://github.com/yoheikikuta/bert-japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "bert-japanese",
                "user_name": "yoheikikuta",
                "description": "BERT with SentencePiece for Japanese text.",
                "multilingual_descriptions": {
                    "en": "BERT with SentencePiece for Japanese text.",
                    "ja": "日本語テキスト用のSentencePieceを使用したBERT。",
                    "zh-hans": "使用SentencePiece的BERT模型用于日语文本。",
                    "zh-hant": "使用SentencePiece的BERT模型進行日文文本處理。"
                }
            },
            "https://github.com/WorksApplications/SudachiTra": {
                "sub_category": "Transformer based models",
                "repository_name": "SudachiTra",
                "user_name": "WorksApplications",
                "description": "Japanese tokenizer for Transformers",
                "multilingual_descriptions": {
                    "en": "Japanese tokenizer for Transformers",
                    "ja": "トランスフォーマー用の日本語トークナイザー",
                    "zh-hans": "用于Transformers的日语分词器",
                    "zh-hant": "Transformer 的日語分詞器"
                }
            },
            "https://github.com/nttcslab/japanese-dialog-transformers": {
                "sub_category": "Transformer based models",
                "repository_name": "japanese-dialog-transformers",
                "user_name": "nttcslab",
                "description": "Code for evaluating Japanese pretrained models provided by NTT Ltd.",
                "multilingual_descriptions": {
                    "en": "Code for evaluating Japanese pretrained models provided by NTT Ltd.",
                    "ja": "NTT株式会社が提供する日本語事前学習モデルの評価コード。",
                    "zh-hans": "NTT有限公司提供的用于评估日语预训练模型的代码。",
                    "zh-hant": "NTT有限公司提供的評估日語預訓練模型的代碼。"
                }
            },
            "https://github.com/octanove/shiba": {
                "sub_category": "Transformer based models",
                "repository_name": "shiba",
                "user_name": "octanove",
                "description": "Pytorch implementation and pre-trained Japanese model for CANINE, the efficient character-level transformer.",
                "multilingual_descriptions": {
                    "en": "Pytorch implementation and pre-trained Japanese model for CANINE, the efficient character-level transformer.",
                    "ja": "CANINE、効率的な文字レベルトランスフォーマーのPytorch実装と事前学習済みの日本語モデル。",
                    "zh-hans": "CANINE是一种高效的字符级转换器，提供了Pytorch实现和预训练的日语模型。",
                    "zh-hant": "CANINE是一種高效的字符級別轉換器，我們提供了Pytorch實現和預訓練的日語模型。"
                }
            },
            "https://github.com/reppy4620/Dialog": {
                "sub_category": "Transformer based models",
                "repository_name": "Dialog",
                "user_name": "reppy4620",
                "description": "A PyTorch Implementation of japanese chatbot using BERT and Transformer's decoder",
                "multilingual_descriptions": {
                    "en": "A PyTorch Implementation of japanese chatbot using BERT and Transformer's decoder",
                    "ja": "BERTとTransformerのデコーダーを使用した日本語チャットボットのPyTorch実装",
                    "zh-hans": "使用BERT和Transformer解码器的日语聊天机器人的PyTorch实现",
                    "zh-hant": "使用BERT和Transformer解碼器的日本聊天機器人的PyTorch實現"
                }
            },
            "https://github.com/retarfi/language-pretraining": {
                "sub_category": "Transformer based models",
                "repository_name": "language-pretraining",
                "user_name": "retarfi",
                "description": "BERT and ELECTRA models of PyTorch implementations for Japanese text.",
                "multilingual_descriptions": {
                    "en": "BERT and ELECTRA models of PyTorch implementations for Japanese text.",
                    "ja": "日本語テキストのPyTorch実装のBERTおよびELECTRAモデル。",
                    "zh-hans": "PyTorch实现的BERT和ELECTRA模型，适用于日语文本。",
                    "zh-hant": "PyTorch 實現的 BERT 和 ELECTRA 模型，適用於日文文本。"
                }
            },
            "https://github.com/ou-medinfo/medbertjp": {
                "sub_category": "Transformer based models",
                "repository_name": "medbertjp",
                "user_name": "ou-medinfo",
                "description": "Trials of pre-trained BERT models for the medical domain in Japanese.",
                "multilingual_descriptions": {
                    "en": "Trials of pre-trained BERT models for the medical domain in Japanese.",
                    "ja": "日本語の医療分野における事前学習済みBERTモデルの試験。",
                    "zh-hans": "在日本医疗领域中，对预训练BERT模型进行试验。",
                    "zh-hant": "在日本醫學領域中，預訓練BERT模型的試驗。"
                }
            },
            "https://github.com/cl-tohoku/ILYS-aoba-chatbot": {
                "sub_category": "Transformer based models",
                "repository_name": "ILYS-aoba-chatbot",
                "user_name": "cl-tohoku",
                "description": "ILYS-aoba-chatbot",
                "multilingual_descriptions": {
                    "en": "ILYS-aoba-chatbot",
                    "ja": "ILYS青葉チャットボット",
                    "zh-hans": "ILYS-aoba聊天机器人",
                    "zh-hant": "ILYS-aoba聊天機器人"
                }
            },
            "https://github.com/megagonlabs/t5-japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "t5-japanese",
                "user_name": "megagonlabs",
                "description": "Codes to pre-train Japanese T5 models",
                "multilingual_descriptions": {
                    "en": "Codes to pre-train Japanese T5 models",
                    "ja": "日本語T5モデルの事前学習のためのコード",
                    "zh-hans": "用于预训练日语T5模型的代码",
                    "zh-hant": "預訓練日語T5模型的代碼"
                }
            },
            "https://github.com/yagays/pytorch_bert_japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "pytorch_bert_japanese",
                "user_name": "yagays",
                "description": "PytorchでBERTの日本語学習済みモデルを利用する",
                "multilingual_descriptions": {
                    "en": "Using a pre-trained Japanese BERT model with Pytorch.",
                    "ja": "PytorchでBERTの日本語学習済みモデルを利用する",
                    "zh-hans": "使用Pytorch利用BERT的日语预训练模型。",
                    "zh-hant": "使用Pytorch來使用BERT的日文預訓練模型。"
                }
            },
            "https://github.com/laboroai/Laboro-BERT-Japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "Laboro-BERT-Japanese",
                "user_name": "laboroai",
                "description": "Laboro BERT Japanese: Japanese BERT Pre-Trained With Web-Corpus",
                "multilingual_descriptions": {
                    "en": "Laboro BERT Japanese: Japanese BERT Pre-Trained With Web-Corpus",
                    "ja": "ラボロBERT日本語：Webコーパスで事前学習された日本語BERT",
                    "zh-hans": "Laboro BERT日语：使用Web语料库预训练的日语BERT",
                    "zh-hant": "Laboro BERT 日語：使用 Web-Corpus 預訓練的日語 BERT"
                }
            },
            "https://github.com/tanreinama/RoBERTa-japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "RoBERTa-japanese",
                "user_name": "tanreinama",
                "description": "Japanese BERT Pretrained Model",
                "multilingual_descriptions": {
                    "en": "Japanese BERT Pretrained Model",
                    "ja": "日本語BERT事前学習モデル",
                    "zh-hans": "日语BERT预训练模型",
                    "zh-hant": "日本BERT預訓練模型"
                }
            },
            "https://github.com/tanreinama/aMLP-japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "aMLP-japanese",
                "user_name": "tanreinama",
                "description": "aMLP Transformer Model for Japanese",
                "multilingual_descriptions": {
                    "en": "aMLP Transformer Model for Japanese",
                    "ja": "日本語用のaMLPトランスフォーマーモデル",
                    "zh-hans": "用于日语的aMLP Transformer模型",
                    "zh-hant": "日本語的aMLP Transformer模型"
                }
            },
            "https://github.com/akirakubo/bert-japanese-aozora": {
                "sub_category": "Transformer based models",
                "repository_name": "bert-japanese-aozora",
                "user_name": "akirakubo",
                "description": "Japanese BERT trained on Aozora Bunko and Wikipedia, pre-tokenized by MeCab with UniDic & SudachiPy",
                "multilingual_descriptions": {
                    "en": "Japanese BERT trained on Aozora Bunko and Wikipedia, pre-tokenized by MeCab with UniDic & SudachiPy",
                    "ja": "青空文庫とウィキペディアで学習し、MeCab（UniDic）およびSudachiPyで事前にトークナイズされた日本語BERT。",
                    "zh-hans": "使用UniDic和SudachiPy进行预分词的日语BERT，训练数据来自青空文库和维基百科。",
                    "zh-hant": "使用UniDic和SudachiPy預先分詞，並在青空文庫和維基百科上訓練的日語BERT。"
                }
            },
            "https://github.com/colorfulscoop/sbert-ja": {
                "sub_category": "Transformer based models",
                "repository_name": "sbert-ja",
                "user_name": "colorfulscoop",
                "description": "Code to train Sentence BERT Japanese model for Hugging Face Model Hub",
                "multilingual_descriptions": {
                    "en": "Code to train Sentence BERT Japanese model for Hugging Face Model Hub",
                    "ja": "ハギングフェイスモデルハブのSentence BERT日本語モデルをトレーニングするためのコード",
                    "zh-hans": "用于 Hugging Face 模型中心训练 Sentence BERT 日语模型的代码",
                    "zh-hant": "用於 Hugging Face Model Hub 的句子 BERT 日語模型訓練代碼"
                }
            },
            "https://github.com/PatrickJohnRamos/BERT-Japan-vaccination": {
                "sub_category": "Transformer based models",
                "repository_name": "BERT-Japan-vaccination",
                "user_name": "PatrickJohnRamos",
                "description": "Official fine-tuning code for \"Emotion Analysis of Japanese Tweets and Comparison to Vaccinations in Japan\"",
                "multilingual_descriptions": {
                    "en": "Official fine-tuning code for \"Emotion Analysis of Japanese Tweets and Comparison to Vaccinations in Japan\"",
                    "ja": "「日本のツイートの感情分析と日本のワクチン接種との比較」の公式微調整コード",
                    "zh-hans": "“日本推文情感分析与疫苗接种比较”的官方微调代码。",
                    "zh-hant": "「日本推文情緒分析與疫苗接種比較」官方微調程式碼"
                }
            },
            "https://github.com/tanreinama/gpt2-japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "gpt2-japanese",
                "user_name": "tanreinama",
                "description": "Japanese GPT2 Generation Model",
                "multilingual_descriptions": {
                    "en": "Japanese GPT2 Generation Model",
                    "ja": "日本語GPT2生成モデル",
                    "zh-hans": "日本GPT2生成模型",
                    "zh-hant": "日本語GPT2生成モデル"
                }
            },
            "https://github.com/tanreinama/text2text-japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "text2text-japanese",
                "user_name": "tanreinama",
                "description": "gpt-2 based text2text conversion model",
                "multilingual_descriptions": {
                    "en": "gpt-2 based text2text conversion model",
                    "ja": "GPT-2ベースのテキスト2テキスト変換モデル",
                    "zh-hans": "基于GPT-2的文本转换模型",
                    "zh-hant": "基於gpt-2的文本轉換模型"
                }
            },
            "https://github.com/colorfulscoop/gpt-ja": {
                "sub_category": "Transformer based models",
                "repository_name": "gpt-ja",
                "user_name": "colorfulscoop",
                "description": "GPT-2 Japanese model for HuggingFace's transformers",
                "multilingual_descriptions": {
                    "en": "GPT-2 Japanese model for HuggingFace's transformers",
                    "ja": "HuggingFaceのtransformers用のGPT-2日本語モデル",
                    "zh-hans": "HuggingFace的转换器GPT-2日语模型",
                    "zh-hant": "HuggingFace 的 transformers 的 GPT-2 日本模型"
                }
            },
            "https://github.com/astremo/friendly_JA-Model": {
                "sub_category": "Transformer based models",
                "repository_name": "friendly_JA-Model",
                "user_name": "astremo",
                "description": "MT model trained using the friendly_JA Corpus attempting to make Japanese easier/more accessible to occidental people by using the Latin/English derived katakana lexicon instead of the standard Sino-Japanese lexicon",
                "multilingual_descriptions": {
                    "en": "MT model trained using the friendly_JA Corpus attempting to make Japanese easier/more accessible to occidental people by using the Latin/English derived katakana lexicon instead of the standard Sino-Japanese lexicon",
                    "ja": "フレンドリー_JAコーパスを使用してトレーニングされたMTモデルは、標準的な漢字語彙の代わりにラテン語/英語由来のカタカナ語彙を使用することで、日本語を西洋人にとってより簡単/アクセスしやすくすることを目指しています。",
                    "zh-hans": "使用友好的日语语料库训练的MT模型，尝试使用拉丁/英语衍生的片假名词汇表，而不是标准的汉日词汇表，使日语更易于/更容易接近西方人。",
                    "zh-hant": "使用friendly_JA語料庫訓練的MT模型，嘗試通過使用拉丁/英語衍生的片假名詞彙表，而不是標準的漢日詞彙表，使日語對西方人更加容易/易於理解。"
                }
            },
            "https://github.com/alinear-corp/albert-japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "albert-japanese",
                "user_name": "alinear-corp",
                "description": "BERT with SentencePiece for Japanese text.",
                "multilingual_descriptions": {
                    "en": "BERT with SentencePiece for Japanese text.",
                    "ja": "日本語テキスト用のSentencePieceを使用したBERT。",
                    "zh-hans": "使用SentencePiece的BERT模型用于日语文本。",
                    "zh-hant": "使用SentencePiece的BERT模型進行日文文本處理。"
                }
            },
            "https://github.com/Kosuke-Szk/ja_text_bert": {
                "sub_category": "Transformer based models",
                "repository_name": "ja_text_bert",
                "user_name": "Kosuke-Szk",
                "description": "日本語WikipediaコーパスでBERTのPre-Trainedモデルを生成するためのリポジトリ",
                "multilingual_descriptions": {
                    "en": "Repository for generating a pre-trained BERT model using the Japanese Wikipedia corpus.",
                    "ja": "日本語WikipediaコーパスでBERTのPre-Trainedモデルを生成するためのリポジトリ",
                    "zh-hans": "用于在日语Wikipedia语料库上生成BERT预训练模型的存储库。",
                    "zh-hant": "在日語Wikipedia語料庫中生成BERT預訓練模型的存儲庫"
                }
            },
            "https://github.com/BandaiNamcoResearchInc/DistilBERT-base-jp": {
                "sub_category": "Transformer based models",
                "repository_name": "DistilBERT-base-jp",
                "user_name": "BandaiNamcoResearchInc",
                "description": "A Japanese DistilBERT pretrained model, which was trained on Wikipedia.",
                "multilingual_descriptions": {
                    "en": "A Japanese DistilBERT pretrained model, which was trained on Wikipedia.",
                    "ja": "日本語のDistilBERT事前学習モデルで、Wikipediaで訓練されました。",
                    "zh-hans": "一个在维基百科上训练的日本DistilBERT预训练模型。",
                    "zh-hant": "一個在維基百科上訓練的日本DistilBERT預訓練模型。"
                }
            },
            "https://github.com/informatix-inc/bert": {
                "sub_category": "Transformer based models",
                "repository_name": "bert",
                "user_name": "informatix-inc",
                "description": "This repository provides snippets to use RoBERTa pre-trained on Japanese corpus. Our dataset consists of Japanese Wikipedia and web-scrolled articles, 25GB in total. The released model is built based on that from HuggingFace.",
                "multilingual_descriptions": {
                    "en": "This repository provides snippets to use RoBERTa pre-trained on Japanese corpus. Our dataset consists of Japanese Wikipedia and web-scrolled articles, 25GB in total. The released model is built based on that from HuggingFace.",
                    "ja": "このリポジトリは、日本語コーパスで事前学習されたRoBERTaを使用するためのスニペットを提供しています。私たちのデータセットは、日本語のWikipediaとWebスクロールされた記事で、合計25GBです。リリースされたモデルは、HuggingFaceからのものをベースに構築されています。",
                    "zh-hans": "该存储库提供了使用RoBERTa在日语语料库上预训练的代码片段。我们的数据集包括日语维基百科和网络滚动文章，总共25GB。发布的模型是基于HuggingFace的模型构建的。",
                    "zh-hant": "這個存儲庫提供了使用 RoBERTa 預訓練於日本語語料庫的片段。我們的數據集包括日本維基百科和網頁滾動文章，總共 25GB。釋出的模型是基於 HuggingFace 的模型構建的。"
                }
            },
            "https://github.com/laboroai/Laboro-DistilBERT-Japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "Laboro-DistilBERT-Japanese",
                "user_name": "laboroai",
                "description": "Laboro DistilBERT Japanese",
                "multilingual_descriptions": {
                    "en": "Laboro DistilBERT Japanese",
                    "ja": "ラボロ DistilBERT 日本語",
                    "zh-hans": "劳罗DistilBERT日语",
                    "zh-hant": "勞羅 DistilBERT 日文"
                }
            },
            "https://github.com/studio-ousia/luke": {
                "sub_category": "Transformer based models",
                "repository_name": "luke",
                "user_name": "studio-ousia",
                "description": "- Language Understanding with Knowledge-based Embeddings",
                "multilingual_descriptions": {
                    "en": "LUKE -- Language Understanding with Knowledge-based Embeddings",
                    "ja": "LUKE -- 知識ベース埋め込みを用いた言語理解",
                    "zh-hans": "LUKE -- 基于知识嵌入的语言理解",
                    "zh-hant": "LUKE -- 基於知識嵌入的語言理解"
                }
            },
            "https://github.com/tanreinama/GPTSAN": {
                "sub_category": "Transformer based models",
                "repository_name": "GPTSAN",
                "user_name": "tanreinama",
                "description": "General-purpose Swich transformer based Japanese language mode",
                "multilingual_descriptions": {
                    "en": "General-purpose Swich transformer based Japanese language mode",
                    "ja": "汎用スイッチトランスをベースにした日本語モード",
                    "zh-hans": "通用开关变压器基于日语模式",
                    "zh-hant": "通用開關變壓器基於日語模式"
                }
            },
            "https://github.com/rinnakk/japanese-clip": {
                "sub_category": "Transformer based models",
                "repository_name": "japanese-clip",
                "user_name": "rinnakk",
                "description": "Japanese CLIP by rinna Co., Ltd.",
                "multilingual_descriptions": {
                    "en": "Japanese CLIP by rinna Co., Ltd.",
                    "ja": "株式会社りんなの日本語クリップ。",
                    "zh-hans": "日本CLIP由rinna有限公司制造。",
                    "zh-hant": "日本CLIP由rinna有限公司開發。"
                }
            },
            "https://github.com/EhimeNLP/AcademicBART": {
                "sub_category": "Transformer based models",
                "repository_name": "AcademicBART",
                "user_name": "EhimeNLP",
                "description": "We pretrained a BART-based Japanese masked language model on paper abstracts from the academic database CiNii Articles",
                "multilingual_descriptions": {
                    "en": "We pretrained a BART-based Japanese masked language model on paper abstracts from the academic database CiNii Articles",
                    "ja": "私たちは、学術データベースCiNii Articlesの論文要約を用いて、BARTベースの日本語マスク言語モデルを事前学習しました。",
                    "zh-hans": "我们在学术数据库CiNii Articles的论文摘要上预训练了一个基于BART的日语掩码语言模型。",
                    "zh-hant": "我們在學術數據庫CiNii Articles的論文摘要上，預先訓練了一個基於BART的日語遮罩語言模型。"
                }
            },
            "https://github.com/EhimeNLP/AcademicRoBERTa": {
                "sub_category": "Transformer based models",
                "repository_name": "AcademicRoBERTa",
                "user_name": "EhimeNLP",
                "description": "We pretrained a RoBERTa-based Japanese masked language model on paper abstracts from the academic database CiNii Articles.",
                "multilingual_descriptions": {
                    "en": "We pretrained a RoBERTa-based Japanese masked language model on paper abstracts from the academic database CiNii Articles.",
                    "ja": "私たちは、学術データベースCiNii Articlesの論文要約を用いて、RoBERTaベースの日本語マスク言語モデルを事前学習しました。",
                    "zh-hans": "我们在学术数据库CiNii Articles的论文摘要上预训练了一个基于RoBERTa的日语掩码语言模型。",
                    "zh-hant": "我們在學術數據庫CiNii Articles的論文摘要上預訓練了一個基於RoBERTa的日語遮罩語言模型。"
                }
            },
            "https://github.com/line/LINE-DistilBERT-Japanese": {
                "sub_category": "Transformer based models",
                "repository_name": "LINE-DistilBERT-Japanese",
                "user_name": "line",
                "description": "DistilBERT model pre-trained on 131 GB of Japanese web text. The teacher model is BERT-base that built in-house at LINE.",
                "multilingual_descriptions": {
                    "en": "DistilBERT model pre-trained on 131 GB of Japanese web text. The teacher model is BERT-base that built in-house at LINE.",
                    "ja": "131 GBの日本語ウェブテキストで事前学習されたDistilBERTモデル。教師モデルは、LINE内で構築されたBERT-baseです。",
                    "zh-hans": "DistilBERT模型在131GB的日语网络文本上进行了预训练。教师模型是LINE内部构建的BERT-base模型。",
                    "zh-hant": "DistilBERT模型預先在131 GB的日本網頁文本上進行了預訓練。教師模型是LINE內部建立的BERT-base模型。"
                }
            },
            "https://github.com/kunishou/Japanese-Alpaca-LoRA": {
                "sub_category": "Transformer based models",
                "repository_name": "Japanese-Alpaca-LoRA",
                "user_name": "kunishou",
                "description": "日本語に翻訳したStanford Alpacaのデータセットを用いてLLaMAをファインチューニングし作成したLow-Rank AdapterのリンクとGenerateサンプルコード",
                "multilingual_descriptions": {
                    "en": "Link to the Low-Rank Adapter created by fine-tuning LLaMA using the Stanford Alpaca dataset translated into Japanese, and sample code for generating it.",
                    "ja": "日本語に翻訳したStanford Alpacaのデータセットを用いてLLaMAをファインチューニングし作成したLow-Rank AdapterのリンクとGenerateサンプルコード",
                    "zh-hans": "使用翻译成日语的Stanford Alpaca数据集对LLaMA进行微调，创建了Low-Rank Adapter，并提供了链接和生成示例代码。",
                    "zh-hant": "使用經過日語翻譯的Stanford Alpaca資料集，進行LLaMA的微調並創建了Low-Rank Adapter，以下是其連結和生成樣本程式碼。"
                }
            },
            "https://github.com/nknytk/albert-japanese-tinysegmenter": {
                "sub_category": "Transformer based models",
                "repository_name": "albert-japanese-tinysegmenter",
                "user_name": "nknytk",
                "description": "Pretrained models, codes and guidances to pretrain official ALBERT(https://github.com/google-research/albert) on Japanese Wikipedia Resources",
                "multilingual_descriptions": {
                    "en": "Pretrained models, codes and guidances to pretrain official ALBERT(https://github.com/google-research/albert) on Japanese Wikipedia Resources",
                    "ja": "日本語のWikipediaリソースで公式ALBERT（https://github.com/google-research/albert）を事前学習するための事前学習済みモデル、コード、ガイダンスを提供します。",
                    "zh-hans": "提供预训练模型、代码和指南，以在日本维基百科资源上预训练官方ALBERT（https://github.com/google-research/albert）。",
                    "zh-hant": "提供預訓練模型、程式碼和指導文件，以在日本維基百科資源上預訓練官方ALBERT（https://github.com/google-research/albert）。"
                }
            },
            "https://github.com/lighttransport/japanese-llama-experiment": {
                "sub_category": "Transformer based models",
                "repository_name": "japanese-llama-experiment",
                "user_name": "lighttransport",
                "description": "Japanese LLaMa experiment",
                "multilingual_descriptions": {
                    "en": "日本のLLaMa実験",
                    "ja": "日本のLLaMa実験\n日本のLLaMa実験",
                    "zh-hans": "日本的LLaMa实验",
                    "zh-hant": "日本的LLaMa實驗"
                }
            },
            "https://github.com/zuntan03/easylightchatassistant": {
                "sub_category": "Transformer based models",
                "repository_name": "easylightchatassistant",
                "user_name": "zuntan03",
                "description": "EasyLightChatAssistant は軽量で検閲や規制のないローカル日本語モデルのLightChatAssistant を、KoboldCpp で簡単にお試しする環境です。",
                "multilingual_descriptions": {
                    "en": "EasyLightChatAssistant は軽量で検閲や規制のないローカル日本語モデルのLightChatAssistant を、KoboldCpp で簡単にお試しする環境です。",
                    "ja": "EasyLightChatAssistantは、KoboldCppで簡単に試すことができる、軽量で検閲や規制のないローカル日本語モデルのLightChatAssistantです。",
                    "zh-hans": "EasyLightChatAssistant是一个轻量级的、没有审查或限制的本地日语模型LightChatAssistant，在KoboldCpp中可以轻松尝试的环境。",
                    "zh-hant": "EasyLightChatAssistant 是一個輕量級的環境，用於輕鬆測試不受審查或規範的本地日語模型LightChatAssistant，使用KoboldCpp。"
                }
            }
        },
        "ChatGPT": {
            "https://github.com/Yuchi-Games/VRChatGPT": {
                "sub_category": null,
                "repository_name": "VRChatGPT",
                "user_name": "Yuchi-Games",
                "description": "ChatGPTを使ってVRChat上でお喋り出来るようにするプログラム。",
                "multilingual_descriptions": {
                    "en": "A program that allows you to chat using ChatGPT in VRChat.",
                    "ja": "ChatGPTを使ってVRChat上でお喋り出来るようにするプログラム。",
                    "zh-hans": "使用ChatGPT程序，可以在VRChat上进行聊天。",
                    "zh-hant": "使用ChatGPT的程式，讓您可以在VRChat上聊天。"
                }
            },
            "https://github.com/M-gen/AITuberDegikkoMirii": {
                "sub_category": null,
                "repository_name": "AITuberDegikkoMirii",
                "user_name": "M-gen",
                "description": "AITuberの基礎となる部分を開発しています",
                "multilingual_descriptions": {
                    "en": "We are developing the foundation of AITuber.",
                    "ja": "AITuberの基礎となる部分を開発しています",
                    "zh-hans": "我们正在开发AITuber的基础部分。",
                    "zh-hant": "我們正在開發AITuber的基礎部分。"
                }
            },
            "https://github.com/hirokidaichi/wanna": {
                "sub_category": null,
                "repository_name": "wanna",
                "user_name": "hirokidaichi",
                "description": "Shell command launcher with natural language",
                "multilingual_descriptions": {
                    "en": "Shell command launcher with natural language",
                    "ja": "自然言語でのシェルコマンド起動ツール",
                    "zh-hans": "带自然语言的Shell命令启动器",
                    "zh-hant": "具有自然語言的Shell命令啟動器"
                }
            },
            "https://github.com/uezo/ChatdollKit": {
                "sub_category": null,
                "repository_name": "ChatdollKit",
                "user_name": "uezo",
                "description": "ChatdollKit enables you to make your 3D model into a chatbot",
                "multilingual_descriptions": {
                    "en": "ChatdollKit enables you to make your 3D model into a chatbot",
                    "ja": "ChatdollKitを使用すると、あなたの3Dモデルをチャットボットに変換できます。",
                    "zh-hans": "ChatdollKit 可以让你将你的3D模型制作成聊天机器人。",
                    "zh-hant": "ChatdollKit 可以讓您將您的 3D 模型製作成聊天機器人。"
                }
            },
            "https://github.com/gyokuro33/ChuanhuChatGPTJapanese": {
                "sub_category": null,
                "repository_name": "ChuanhuChatGPTJapanese",
                "user_name": "gyokuro33",
                "description": "GUI for ChatGPT API For Japanese",
                "multilingual_descriptions": {
                    "en": "GUI for ChatGPT API For Japanese",
                    "ja": "日本語のChatGPT API用GUI",
                    "zh-hans": "ChatGPT API的日语GUI",
                    "zh-hant": "ChatGPT API 日文版的 GUI"
                }
            },
            "https://github.com/manju-summoner/AISisterAIChan": {
                "sub_category": null,
                "repository_name": "AISisterAIChan",
                "user_name": "manju-summoner",
                "description": "ChatGPT3.5を搭載した伺かゴースト「AI妹アイちゃん」です。利用には別途ChatGPTのAPIキーが必要です。",
                "multilingual_descriptions": {
                    "en": "This is a Siro Ghost equipped with ChatGPT3.5, called \"AI Imouto Aichan\". A separate ChatGPT API key is required to use it.",
                    "ja": "ChatGPT3.5を搭載した伺かゴースト「AI妹アイちゃん」です。利用には別途ChatGPTのAPIキーが必要です。",
                    "zh-hans": "这是搭载了ChatGPT3.5的伺かGhost“AI妹妹爱酱”。使用需要另外获取ChatGPT的API密钥。",
                    "zh-hant": "這是搭載了ChatGPT3.5的伺か鬼「AI妹アイちゃん」。使用需要另外準備ChatGPT的API金鑰。"
                }
            },
            "https://github.com/Geson-anko/vrchatbot": {
                "sub_category": null,
                "repository_name": "vrchatbot",
                "user_name": "Geson-anko",
                "description": "VRChatにAI Botを作るためのリポジトリ",
                "multilingual_descriptions": {
                    "en": "Repository for creating AI bots in VRChat",
                    "ja": "VRChatにAI Botを作るためのリポジトリ",
                    "zh-hans": "用于创建VRChat AI机器人的代码库",
                    "zh-hant": "建立VRChat AI Bot的存儲庫"
                }
            },
            "https://github.com/karakuri-ai/gptuber-by-langchain": {
                "sub_category": null,
                "repository_name": "gptuber-by-langchain",
                "user_name": "karakuri-ai",
                "description": "GPTがYouTuberをやります",
                "multilingual_descriptions": {
                    "en": "GPT will become a YouTuber.",
                    "ja": "GPTがYouTuberをやります",
                    "zh-hans": "GPT将成为YouTuber。",
                    "zh-hant": "GPT會當YouTuber"
                }
            },
            "https://github.com/supershaneski/openai-chatfriend": {
                "sub_category": null,
                "repository_name": "openai-chatfriend",
                "user_name": "supershaneski",
                "description": "A chatbox application built using Nuxt 3 powered by Open AI Text completion endpoint. You can select different personality of your AI friend. The default will respond in Japanese. You can use this app to practice your Nihongo skills!",
                "multilingual_descriptions": {
                    "en": "A chatbox application built using Nuxt 3 powered by Open AI Text completion endpoint. You can select different personality of your AI friend. The default will respond in Japanese. You can use this app to practice your Nihongo skills!",
                    "ja": "Nuxt 3を使用して構築されたチャットボックスアプリケーションで、Open AIテキスト補完エンドポイントによって動作します。AIフレンドの異なるパーソナリティを選択できます。デフォルトでは日本語で応答します。このアプリを使用して、日本語のスキルを練習することができます！",
                    "zh-hans": "一个使用Nuxt 3构建的聊天框应用程序，由Open AI文本完成端点提供支持。您可以选择不同的AI朋友个性。默认情况下，它会用日语回复。您可以使用此应用程序练习您的日语技能！",
                    "zh-hant": "一個使用 Nuxt 3 構建的聊天框應用程序，由 Open AI 文本完成端點提供支持。您可以選擇不同的 AI 朋友個性。默認情況下，它會用日語回答。您可以使用此應用程序練習您的日語技能！"
                }
            },
            "https://github.com/franzwong/chrome-ext-translate-to-hiragana-with-chatgpt": {
                "sub_category": null,
                "repository_name": "chrome-ext-translate-to-hiragana-with-chatgpt",
                "user_name": "franzwong",
                "description": "This Chrome extension can translate selected Japanese text to Hiragana by using ChatGPT.",
                "multilingual_descriptions": {
                    "en": "This Chrome extension can translate selected Japanese text to Hiragana by using ChatGPT.",
                    "ja": "このChrome拡張機能は、ChatGPTを使用して選択した日本語テキストをひらがなに翻訳できます。",
                    "zh-hans": "这个Chrome扩展程序可以使用ChatGPT将选定的日语文本翻译成平假名。",
                    "zh-hant": "這個 Chrome 擴充功能可以使用 ChatGPT 將選定的日文文本翻譯成平假名。"
                }
            },
            "https://github.com/nohanaga/azure-search-openai-demo": {
                "sub_category": null,
                "repository_name": "azure-search-openai-demo",
                "user_name": "nohanaga",
                "description": "このサンプルでは、Retrieval Augmented Generation パターンを使用して、独自のデータに対してChatGPT のような体験を作成するためのいくつかのアプローチを示しています。",
                "multilingual_descriptions": {
                    "en": "In this sample, we demonstrate several approaches to creating an experience similar to ChatGPT for proprietary data using the Retrieval Augmented Generation pattern.",
                    "ja": "このサンプルでは、Retrieval Augmented Generation パターンを使用して、独自のデータに対してChatGPT のような体験を作成するためのいくつかのアプローチを示しています。",
                    "zh-hans": "在这个样例中，我们使用检索增强生成模式，展示了几种方法来创建类似于ChatGPT的体验，以适用于您自己的数据。",
                    "zh-hant": "在這個範例中，我們使用檢索增強生成模式，展示了一些創建類似ChatGPT體驗的方法，以應用於自己的數據。"
                }
            },
            "https://github.com/pixiv/chatvrm": {
                "sub_category": null,
                "repository_name": "chatvrm",
                "user_name": "pixiv",
                "description": "ChatVRMはブラウザで簡単に3Dキャラクターと会話ができるデモアプリケーションです。",
                "multilingual_descriptions": {
                    "en": "ChatVRM is a demo application that allows you to easily chat with 3D characters in your browser.",
                    "ja": "ChatVRMはブラウザで簡単に3Dキャラクターと会話ができるデモアプリケーションです。",
                    "zh-hans": "ChatVRM是一个可以在浏览器中轻松与3D角色交谈的演示应用程序。",
                    "zh-hant": "ChatVRM是一個可以在瀏覽器中輕鬆與3D角色對話的演示應用程式。"
                }
            },
            "https://github.com/kmizu/sftly-replace": {
                "sub_category": null,
                "repository_name": "sftly-replace",
                "user_name": "kmizu",
                "description": "A Chrome extention to replace the selected text softly",
                "multilingual_descriptions": {
                    "en": "A Chrome extention to replace the selected text softly",
                    "ja": "選択したテキストをやさしく置き換えるためのChrome拡張機能",
                    "zh-hans": "一个Chrome扩展，可以轻松替换所选文本",
                    "zh-hant": "一個Chrome擴展程序，可以輕鬆替換所選文本"
                }
            },
            "https://github.com/rkmt/summarize_arxv": {
                "sub_category": null,
                "repository_name": "summarize_arxv",
                "user_name": "rkmt",
                "description": "Summarize arXiv paper with figures",
                "multilingual_descriptions": {
                    "en": "Summarize arXiv paper with figures",
                    "ja": "図を含むarXiv論文を要約する。",
                    "zh-hans": "用图表总结arXiv论文",
                    "zh-hant": "用圖表總結arXiv論文"
                }
            },
            "https://github.com/uezo/aiavatarkit": {
                "sub_category": null,
                "repository_name": "aiavatarkit",
                "user_name": "uezo",
                "description": "Building AI-based conversational avatars lightning fast",
                "multilingual_descriptions": {
                    "en": "Building AI-based conversational avatars lightning fast",
                    "ja": "AIベースの会話型アバターを超高速で構築する",
                    "zh-hans": "快速构建基于人工智能的对话化头像",
                    "zh-hant": "快速建立基於人工智慧的對話化頭像"
                }
            },
            "https://github.com/City-of-Kobe/pva-aoai-integration-solution": {
                "sub_category": null,
                "repository_name": "pva-aoai-integration-solution",
                "user_name": "City-of-Kobe",
                "description": "このリポジトリは、神戸市役所でのChatGPTの試行利用に向けて作成したフロー等をソリューション化し公開するものです。",
                "multilingual_descriptions": {
                    "en": "This repository is intended to package and release the flows and other solutions created for the trial use of ChatGPT at Kobe City Hall.",
                    "ja": "このリポジトリは、神戸市役所でのChatGPTの試行利用に向けて作成したフロー等をソリューション化し公開するものです。",
                    "zh-hans": "这个存储库是为了将在神户市政府试用ChatGPT的流程等转化为解决方案并公开而创建的。",
                    "zh-hant": "這個存儲庫是為了將在神戶市政府進行的ChatGPT試行使用所創建的流程等進行解決方案化並公開。"
                }
            },
            "https://github.com/azure-samples/jp-azureopenai-samples": {
                "sub_category": null,
                "repository_name": "jp-azureopenai-samples",
                "user_name": "azure-samples",
                "description": "Azure OpenAIを活用したアプリケーション実装のリファレンスを目的として、アプリのサンプル（リファレンスアーキテクチャ、サンプルコードとデプロイ手順）を無償提供しています。",
                "multilingual_descriptions": {
                    "en": "We provide free samples of applications (reference architecture, sample code, and deployment instructions) for the purpose of implementing applications using Azure OpenAI.",
                    "ja": "Azure OpenAIを活用したアプリケーション実装のリファレンスを目的として、アプリのサンプル（リファレンスアーキテクチャ、サンプルコードとデプロイ手順）を無償提供しています。",
                    "zh-hans": "为了提供使用Azure OpenAI实现应用程序的参考，我们免费提供应用程序示例（参考架构、示例代码和部署步骤）。",
                    "zh-hant": "為了提供使用Azure OpenAI進行應用程式實作的參考，我們免費提供應用程式的範例（參考架構、範例程式碼和部署步驟）。"
                }
            },
            "https://github.com/mutaguchi/character_chat": {
                "sub_category": null,
                "repository_name": "character_chat",
                "user_name": "mutaguchi",
                "description": "OpenAIのAPIを利用して、設定したキャラクターと日本語で会話するチャットスクリプトです。",
                "multilingual_descriptions": {
                    "en": "This is a chat script that uses OpenAI's API to have a conversation with a character set in Japanese.",
                    "ja": "OpenAIのAPIを利用して、設定したキャラクターと日本語で会話するチャットスクリプトです。",
                    "zh-hans": "这是一个使用OpenAI API的聊天脚本，可以与设定的角色用日语进行对话。",
                    "zh-hant": "這是一個使用OpenAI API的聊天腳本，可以與設定的角色用日語進行對話。"
                }
            },
            "https://github.com/sifue/chatgpt-slackbot": {
                "sub_category": null,
                "repository_name": "chatgpt-slackbot",
                "user_name": "sifue",
                "description": "OpenAIのChatGPT APIをSlack上で利用するためのSlackbotスクリプト (日本語での利用が前提)",
                "multilingual_descriptions": {
                    "en": "Slackbot script for using OpenAI's ChatGPT API on Slack (assumes usage in Japanese)",
                    "ja": "OpenAIのChatGPT APIをSlack上で利用するためのSlackbotスクリプト (日本語での利用が前提)",
                    "zh-hans": "用于在Slack上使用OpenAI的ChatGPT API的Slackbot脚本（假设使用日语）",
                    "zh-hant": "用於在Slack上使用OpenAI的ChatGPT API的Slackbot腳本（假設使用日語）\n用於在Slack上使用OpenAI的ChatGPT API的Slackbot腳本（假設使用日語）"
                }
            },
            "https://github.com/dahatake/chatgpt-prompt-sample-japanese": {
                "sub_category": null,
                "repository_name": "chatgpt-prompt-sample-japanese",
                "user_name": "dahatake",
                "description": "ChatGPT の Prompt のサンプルです。",
                "multilingual_descriptions": {
                    "en": "This is a sample of ChatGPT's prompt.",
                    "ja": "ChatGPT の Prompt のサンプルです。",
                    "zh-hans": "这是ChatGPT的提示示例。",
                    "zh-hant": "這是ChatGPT的提示示例。\nChatGPT的提示示例。"
                }
            },
            "https://github.com/adilmoujahid/kanji-flashcard-app-gpt4": {
                "sub_category": null,
                "repository_name": "kanji-flashcard-app-gpt4",
                "user_name": "adilmoujahid",
                "description": "A Japanese Kanji Flashcard App built using Python and Langchain, enhanced with the intelligence of GPT-4.",
                "multilingual_descriptions": {
                    "en": "A Japanese Kanji Flashcard App built using Python and Langchain, enhanced with the intelligence of GPT-4.",
                    "ja": "PythonとLangchainを使用して構築された日本語漢字フラッシュカードアプリで、GPT-4の知能が強化されています。",
                    "zh-hans": "一个使用Python和Langchain构建的日语汉字闪卡应用，结合了GPT-4的智能功能。",
                    "zh-hant": "一個使用Python和Langchain構建的日語漢字閃卡應用程序，並搭載了GPT-4的智能增強功能。"
                }
            },
            "https://github.com/jungokasai/IgakuQA": {
                "sub_category": null,
                "repository_name": "IgakuQA",
                "user_name": "jungokasai",
                "description": "Evaluating GPT-4 and ChatGPT on Japanese Medical Licensing Examinations",
                "multilingual_descriptions": {
                    "en": "Evaluating GPT-4 and ChatGPT on Japanese Medical Licensing Examinations",
                    "ja": "日本の医師免許試験におけるGPT-4とChatGPTの評価",
                    "zh-hans": "评估GPT-4和ChatGPT在日本医学执照考试中的表现",
                    "zh-hant": "評估GPT-4和ChatGPT在日本醫學執照考試上的表現"
                }
            },
            "https://github.com/retrieva/japagen": {
                "sub_category": null,
                "repository_name": "japagen",
                "user_name": "retrieva",
                "description": "日本語タスクにおけるLLMを用いた疑似学習データ生成の検討",
                "multilingual_descriptions": {
                    "en": "Investigation of pseudo-learning data generation using LLM in Japanese language tasks",
                    "ja": "日本語タスクにおけるLLMを用いた疑似学習データ生成の検討",
                    "zh-hans": "使用LLM在日语任务中生成伪学习数据的研究",
                    "zh-hant": "使用LLM在日語任務中生成虛擬學習數據的研究"
                }
            }
        },
        "Dictionary and IME": {
            "https://github.com/neologd/mecab-ipadic-neologd": {
                "sub_category": null,
                "repository_name": "mecab-ipadic-neologd",
                "user_name": "neologd",
                "description": "Neologism dictionary based on the language resources on the Web for mecab-ipadic",
                "multilingual_descriptions": {
                    "en": "Neologism dictionary based on the language resources on the Web for mecab-ipadic",
                    "ja": "「mecab-ipadic」に基づくウェブ上の言語リソースに基づく新語辞典",
                    "zh-hans": "基于网络语言资源的新词典，适用于mecab-ipadic。",
                    "zh-hant": "基於網絡語言資源的新詞典，適用於mecab-ipadic。"
                }
            },
            "https://github.com/PKSHATechnology-Research/tdmelodic": {
                "sub_category": null,
                "repository_name": "tdmelodic",
                "user_name": "PKSHATechnology-Research",
                "description": "A Japanese accent dictionary generator",
                "multilingual_descriptions": {
                    "en": "A Japanese accent dictionary generator",
                    "ja": "日本語アクセント辞書ジェネレーター",
                    "zh-hans": "一个日语口音词典生成器",
                    "zh-hant": "一個日本口音字典生成器"
                }
            },
            "https://github.com/neocl/jamdict": {
                "sub_category": null,
                "repository_name": "jamdict",
                "user_name": "neocl",
                "description": "Python 3 library for manipulating Jim Breen's JMdict, KanjiDic2, JMnedict and kanji-radical mappings",
                "multilingual_descriptions": {
                    "en": "Python 3 library for manipulating Jim Breen's JMdict, KanjiDic2, JMnedict and kanji-radical mappings",
                    "ja": "Jim Breen氏のJMdict、KanjiDic2、JMnedict、漢字ラジカルマッピングを操作するためのPython 3ライブラリ",
                    "zh-hans": "Python 3 库，用于操作 Jim Breen 的 JMdict、KanjiDic2、JMnedict 和汉字-部首映射。",
                    "zh-hant": "Python 3 庫，用於操作Jim Breen的JMdict、KanjiDic2、JMnedict和漢字-部首映射。"
                }
            },
            "https://github.com/polm/unidic-py": {
                "sub_category": null,
                "repository_name": "unidic-py",
                "user_name": "polm",
                "description": "Unidic packaged for installation via pip.",
                "multilingual_descriptions": {
                    "en": "Unidic packaged for installation via pip.",
                    "ja": "pipを介してインストールするためにパッケージ化されたUnidic。",
                    "zh-hans": "通过pip安装的Unidic包。",
                    "zh-hant": "透過pip安裝的Unidic打包。"
                }
            },
            "https://github.com/chakki-works/Japanese-Company-Lexicon": {
                "sub_category": null,
                "repository_name": "Japanese-Company-Lexicon",
                "user_name": "chakki-works",
                "description": "Japanese Company Lexicon (JCLdic)",
                "multilingual_descriptions": {
                    "en": "Japanese Company Lexicon (JCLdic)",
                    "ja": "日本企業用語辞典（JCLdic）",
                    "zh-hans": "日本公司词典（JCLdic）",
                    "zh-hant": "日本公司用語辭典（JCLdic）"
                }
            },
            "https://github.com/yagays/manbyo-sudachi": {
                "sub_category": null,
                "repository_name": "manbyo-sudachi",
                "user_name": "yagays",
                "description": "Sudachi向け万病辞書",
                "multilingual_descriptions": {
                    "en": "A comprehensive medical dictionary for Sudachi.",
                    "ja": "すだち向け万病辞書",
                    "zh-hans": "Sudachi专用万病词典",
                    "zh-hant": "酸橙專用萬病辭書"
                }
            },
            "https://github.com/tokuhirom/jawiki-kana-kanji-dict": {
                "sub_category": null,
                "repository_name": "jawiki-kana-kanji-dict",
                "user_name": "tokuhirom",
                "description": "Generate SKK/MeCab dictionary from Wikipedia(Japanese edition)",
                "multilingual_descriptions": {
                    "en": "Generate SKK/MeCab dictionary from Wikipedia(Japanese edition)",
                    "ja": "Wikipedia（日本語版）からSKK/MeCab辞書を生成する。",
                    "zh-hans": "从维基百科（日文版）生成SKK/MeCab词典",
                    "zh-hant": "從維基百科（日文版）生成SKK / MeCab詞典"
                }
            },
            "https://github.com/sociocom/JIWC-Dictionary": {
                "sub_category": null,
                "repository_name": "JIWC-Dictionary",
                "user_name": "sociocom",
                "description": "dictionary to find emotion related to text",
                "multilingual_descriptions": {
                    "en": "dictionary to find emotion related to text",
                    "ja": "テキストに関連する感情を見つけるための辞書",
                    "zh-hans": "用于查找与文本相关的情感的字典",
                    "zh-hant": "字典以尋找與文本相關的情感"
                }
            },
            "https://github.com/ku-nlp/JumanDIC": {
                "sub_category": null,
                "repository_name": "JumanDIC",
                "user_name": "ku-nlp",
                "description": "This repository contains source dictionary files to build dictionaries for JUMAN and Juman++.",
                "multilingual_descriptions": {
                    "en": "This repository contains source dictionary files to build dictionaries for JUMAN and Juman++.",
                    "ja": "このリポジトリには、JUMANとJuman ++の辞書を構築するためのソース辞書ファイルが含まれています。",
                    "zh-hans": "这个仓库包含源字典文件，用于构建 JUMAN 和 Juman++ 的字典。",
                    "zh-hant": "這個存儲庫包含源字典文件，用於構建 JUMAN 和 Juman++ 的字典。"
                }
            },
            "https://github.com/polm/ipadic-py": {
                "sub_category": null,
                "repository_name": "ipadic-py",
                "user_name": "polm",
                "description": "IPAdic packaged for easy use from Python.",
                "multilingual_descriptions": {
                    "en": "IPAdic packaged for easy use from Python.",
                    "ja": "Pythonから簡単に使用できるようにパッケージ化されたIPAdic。",
                    "zh-hans": "IPAdic打包为Python易用的形式。",
                    "zh-hant": "IPAdic打包成Python易於使用的套件。"
                }
            },
            "https://github.com/polm/unidic-lite": {
                "sub_category": null,
                "repository_name": "unidic-lite",
                "user_name": "polm",
                "description": "A small version of UniDic for easy pip installs.",
                "multilingual_descriptions": {
                    "en": "A small version of UniDic for easy pip installs.",
                    "ja": "簡単なpipインストール用のUniDicの小さなバージョン。",
                    "zh-hans": "一个小版本的UniDic，方便进行pip安装。",
                    "zh-hant": "一個小型的UniDic版本，方便進行pip安裝。"
                }
            },
            "https://github.com/peaceiris/emoji-ime-dictionary": {
                "sub_category": null,
                "repository_name": "emoji-ime-dictionary",
                "user_name": "peaceiris",
                "description": "日本語で絵文字入力をするための IME 追加辞書 orange_book Google 日本語入力などで日本語から絵文字への変換を可能にする IME 拡張辞書",
                "multilingual_descriptions": {
                    "en": "An IME additional dictionary for inputting emojis in Japanese, such as the Google Japanese Input, which enables conversion from Japanese to emojis through an IME extension dictionary.",
                    "ja": "日本語で絵文字入力をするための IME 追加辞書 orange_book Google 日本語入力などで日本語から絵文字への変換を可能にする IME 拡張辞書",
                    "zh-hans": "用于在日语中输入表情符号的 IME 附加词典，如 Google 日语输入法等，可将日语转换为表情符号的 IME 扩展词典。",
                    "zh-hant": "日本語輸入表情符號的 IME 附加詞典 orange_book，Google 日本語輸入等可將日本語轉換為表情符號的 IME 擴展詞典。"
                }
            },
            "https://github.com/peaceiris/google-ime-dictionary": {
                "sub_category": null,
                "repository_name": "google-ime-dictionary",
                "user_name": "peaceiris",
                "description": "日英変換・英語略語展開のための IME 追加辞書 orange_book 日本語から英語への和英変換や英語略語の展開を Google 日本語入力や ATOK などで可能にする IME 拡張辞書",
                "multilingual_descriptions": {
                    "en": "An IME additional dictionary called \"orange_book\" for Japanese-English conversion and expansion of English abbreviations, which enables Japanese-English conversion and expansion of English abbreviations in Google Japanese Input and ATOK.",
                    "ja": "日英変換・英語略語展開のための IME 追加辞書 orange_book 日本語から英語への和英変換や英語略語の展開を Google 日本語入力や ATOK などで可能にする IME 拡張辞書",
                    "zh-hans": "用于日英转换和英语缩写展开的 IME 附加词典 orange_book，可在 Google 日本语输入或 ATOK 等中实现从日语到英语的和英转换和英语缩写展开的 IME 扩展词典。",
                    "zh-hant": "日英轉換・英語縮寫展開的 IME 追加詞典 orange_book，可在 Google 日本語輸入法或 ATOK 等輸入法中實現從日語到英語的和英轉換和英語縮寫展開的 IME 擴展詞典。"
                }
            },
            "https://github.com/ncaq/dic-nico-intersection-pixiv": {
                "sub_category": null,
                "repository_name": "dic-nico-intersection-pixiv",
                "user_name": "ncaq",
                "description": "ニコニコ大百科とピクシブ百科事典の共通部分のIME辞書",
                "multilingual_descriptions": {
                    "en": "IME dictionary for the common parts of Nico Nico Daihyakka and Pixiv Encyclopedia.",
                    "ja": "ニコニコ大百科とピクシブ百科事典の共通部分のIME辞書",
                    "zh-hans": "NicoNico大百科和Pixiv百科全书共同部分的IME词典。",
                    "zh-hant": "NicoNico大百科和Pixiv百科全書共同部分的IME詞典"
                }
            },
            "https://github.com/KEINOS/google-ime-user-dictionary-ja-en": {
                "sub_category": null,
                "repository_name": "google-ime-user-dictionary-ja-en",
                "user_name": "KEINOS",
                "description": "GoogleIME用カタカナ語辞書プロジェクトのアーカイブです。Project archive of Google IME user dictionary from Katakana word ( Japanese loanword ) to English.",
                "multilingual_descriptions": {
                    "en": "GoogleIME用カタカナ語辞書プロジェクトのアーカイブです。Project archive of Google IME user dictionary from Katakana word ( Japanese loanword ) to English.",
                    "ja": "これはGoogleIME用カタカナ語辞書プロジェクトのアーカイブです。日本語の外来語から英語へのGoogle IMEユーザー辞書のプロジェクトアーカイブです。",
                    "zh-hans": "这是GoogleIME用的日语片假名词典项目的存档，从片假名词（即日语外来词）翻译成英语。",
                    "zh-hant": "這是GoogleIME用片假名詞彙字典專案的存檔，從日語外來詞的片假名詞彙轉換為英語。"
                }
            },
            "https://github.com/tiwanari/emoticon": {
                "sub_category": null,
                "repository_name": "emoticon",
                "user_name": "tiwanari",
                "description": "Google日本語入力の顔文字辞書∩(,,Ò‿Ó,,)∩",
                "multilingual_descriptions": {
                    "en": "Google Japanese Input's emoticon dictionary ∩(,,Ò‿Ó,,)∩",
                    "ja": "Google日本語入力の顔文字辞書∩(,,Ò‿Ó,,)∩",
                    "zh-hans": "Google日本语输入的表情符号字典∩(,,Ò‿Ó,,)∩",
                    "zh-hant": "Google日本語輸入的表情符號字典∩(,,Ò‿Ó,,)∩"
                }
            },
            "https://github.com/akirakubo/mecab-mozcdic": {
                "sub_category": null,
                "repository_name": "mecab-mozcdic",
                "user_name": "akirakubo",
                "description": "open source mozc dictionaryをMeCab辞書のフォーマットに変換したものです。",
                "multilingual_descriptions": {
                    "en": "This is a conversion of the open source mozc dictionary to the MeCab dictionary format.",
                    "ja": "open source mozc dictionaryをMeCab辞書のフォーマットに変換したものです。",
                    "zh-hans": "这是将开源mozc词典转换为MeCab词典格式的结果。",
                    "zh-hant": "這是將開源mozc字典轉換為MeCab字典格式的結果。"
                }
            },
            "https://github.com/albno273/denonbu-ime-dic": {
                "sub_category": null,
                "repository_name": "denonbu-ime-dic",
                "user_name": "albno273",
                "description": "電音IME: Microsoft IMEなどで利用することを想定した「電音部」関連用語の辞書",
                "multilingual_descriptions": {
                    "en": "Electric Sound Dictionary: A dictionary of terms related to \"Electric Sound Department\" intended for use with Microsoft IME and other similar software.",
                    "ja": "電音IME: Microsoft IMEなどで利用することを想定した「電音部」関連用語の辞書",
                    "zh-hans": "电音IME：用于Microsoft IME等的“电音部”相关术语词典。",
                    "zh-hant": "電音IME：針對Microsoft IME等輸入法所設計的「電音部」相關用語詞典。"
                }
            },
            "https://github.com/Umichang/nijisanji-ime-dic": {
                "sub_category": null,
                "repository_name": "nijisanji-ime-dic",
                "user_name": "Umichang",
                "description": "Microsoft IMEなどで利用することを想定した「にじさんじ」関連用語の用語辞書です。",
                "multilingual_descriptions": {
                    "en": "This is a glossary of \"Nijisanji\" related terms intended for use with Microsoft IME and other similar software.",
                    "ja": "Microsoft IMEなどで利用することを想定した「にじさんじ」関連用語の用語辞書です。",
                    "zh-hans": "这是一个“虹三”相关术语词典，旨在供Microsoft IME等使用。",
                    "zh-hant": "這是一個針對 Microsoft IME 等輸入法所設計的「にじさんじ」相關用語詞典。"
                }
            },
            "https://github.com/Umichang/pokemon-ime-dic": {
                "sub_category": null,
                "repository_name": "pokemon-ime-dic",
                "user_name": "Umichang",
                "description": "Microsoft IMEなどで利用することを想定した、現状判明している全てのポケモンの名前を網羅した用語辞書です。",
                "multilingual_descriptions": {
                    "en": "This is a terminology dictionary that covers the names of all currently known Pokémon, intended for use with Microsoft IME and similar software.",
                    "ja": "Microsoft IMEなどで利用することを想定した、現状判明している全てのポケモンの名前を網羅した用語辞書です。",
                    "zh-hans": "这是一个包含目前已知的所有宝可梦名称的术语词典，旨在供Microsoft IME等输入法使用。",
                    "zh-hant": "這是一個包含目前已知所有寶可夢名稱的用語詞典，旨在供Microsoft IME等輸入法使用。"
                }
            },
            "https://github.com/kujirahand/EJDict": {
                "sub_category": null,
                "repository_name": "EJDict",
                "user_name": "kujirahand",
                "description": "English-Japanese Dictionary data (Public Domain) EJDict-hand",
                "multilingual_descriptions": {
                    "en": "English-Japanese Dictionary data (Public Domain) EJDict-hand",
                    "ja": "英和辞書データ（パブリックドメイン）EJDict-hand",
                    "zh-hans": "英日词典数据（公共领域）EJDict-hand",
                    "zh-hant": "英日辭典數據（公共領域）EJDict-hand"
                }
            },
            "https://github.com/Rinrin0413/Ayashiy-Nipongo-Dic": {
                "sub_category": null,
                "repository_name": "Ayashiy-Nipongo-Dic",
                "user_name": "Rinrin0413",
                "description": "贵樣ばこゐ辞畫を使て正レい日本语を使ラことが出來ゑ。",
                "multilingual_descriptions": {
                    "en": "Using the precious tobacco box as a visual aid, it is possible to speak proper Japanese.",
                    "ja": "贵樣ばこゐ辞畫を使て正レい日本语を使ラことが出來ゑ。",
                    "zh-hans": "通过使用贵样笔画，可以正规地使用日语。",
                    "zh-hant": "利用貴公司提供的輸入法，可以正確地使用日語。"
                }
            },
            "https://github.com/kotofurumiya/genshin-dict": {
                "sub_category": null,
                "repository_name": "genshin-dict",
                "user_name": "kotofurumiya",
                "description": "Windows/macOSで使える原神の単語辞書です",
                "multilingual_descriptions": {
                    "en": "This is a vocabulary dictionary for Genshin Impact that can be used on Windows/macOS.",
                    "ja": "Windows/macOSで利用可能な原神の用語辞書です。",
                    "zh-hans": "这是一个可在Windows/macOS上使用的原神词典。",
                    "zh-hant": "這是可用於 Windows/macOS 的原神詞彙字典。"
                }
            },
            "https://github.com/scriptin/jmdict-simplified": {
                "sub_category": null,
                "repository_name": "jmdict-simplified",
                "user_name": "scriptin",
                "description": "JMdict and JMnedict in JSON format",
                "multilingual_descriptions": {
                    "en": "JMdict and JMnedict in JSON format",
                    "ja": "JMdictとJMnedictをJSON形式で入力してください。",
                    "zh-hans": "JMdict和JMnedict的JSON格式",
                    "zh-hant": "JMdict和JMnedict的JSON格式"
                }
            },
            "https://github.com/reasonset/mozcdict-ext": {
                "sub_category": null,
                "repository_name": "mozcdict-ext",
                "user_name": "reasonset",
                "description": "Convert external words into Mozc system dictionary",
                "multilingual_descriptions": {
                    "en": "Convert external words into Mozc system dictionary",
                    "ja": "外部の単語をMozcシステム辞書に変換する。",
                    "zh-hans": "将外部词汇转换为Mozc系统词典",
                    "zh-hant": "將外部單詞轉換為Mozc系統詞典"
                }
            },
            "https://github.com/utubo/mh-dict-jp": {
                "sub_category": null,
                "repository_name": "mh-dict-jp",
                "user_name": "utubo",
                "description": "MonsterHunterのユーザー辞書を作りたい…",
                "multilingual_descriptions": {
                    "en": "I want to create a user dictionary for Monster Hunter...",
                    "ja": "MonsterHunterのユーザー辞書を作りたい…",
                    "zh-hans": "想要制作Monster Hunter的用户词典…",
                    "zh-hant": "想要創建Monster Hunter的用戶詞典..."
                }
            },
            "https://github.com/stephenmk/jitenbot": {
                "sub_category": null,
                "repository_name": "jitenbot",
                "user_name": "stephenmk",
                "description": "Convert data from Japanese dictionary websites and applications into portable file formats",
                "multilingual_descriptions": {
                    "en": "Convert data from Japanese dictionary websites and applications into portable file formats",
                    "ja": "日本語の辞書ウェブサイトやアプリからデータをポータブルなファイル形式に変換する",
                    "zh-hans": "将日语字典网站和应用程序中的数据转换为便携文件格式",
                    "zh-hant": "將日本字典網站和應用程式的資料轉換為可攜式檔案格式。"
                }
            },
            "https://github.com/neologd/mecab-unidic-neologd": {
                "sub_category": null,
                "repository_name": "mecab-unidic-neologd",
                "user_name": "neologd",
                "description": "Neologism dictionary based on the language resources on the Web for mecab-unidic",
                "multilingual_descriptions": {
                    "en": "Neologism dictionary based on the language resources on the Web for mecab-unidic",
                    "ja": "mecab-unidicの言語リソースに基づいたネオログ辞書",
                    "zh-hans": "基于网络语言资源的mecab-unidic新词典",
                    "zh-hant": "基於網絡語言資源的mecab-unidic新詞典"
                }
            },
            "https://github.com/heppokofrontend/hololive-dictionary": {
                "sub_category": null,
                "repository_name": "hololive-dictionary",
                "user_name": "heppokofrontend",
                "description": "ホロライブ（ホロライブプロダクション）に関する辞書ファイルです。./dictionary フォルダ内のテキストファイルを使って、IMEに単語を追加できます。詳細はREADME.mdをご覧ください。",
                "multilingual_descriptions": {
                    "en": "This is a dictionary file about Hololive (Hololive Production). You can use the text files in the ./dictionary folder to add words to your IME. Please refer to README.md for more details.",
                    "ja": "ホロライブ（ホロライブプロダクション）に関する辞書ファイルです。./dictionary フォルダ内のテキストファイルを使って、IMEに単語を追加できます。詳細はREADME.mdをご覧ください。",
                    "zh-hans": "这是关于Hololive（Hololive Production）的词典文件。您可以使用./dictionary文件夹中的文本文件将单词添加到输入法中。详细信息请参阅README.md。",
                    "zh-hant": "這是關於Hololive（Hololive Production）的字典文件。您可以使用./dictionary文件夾中的文本文件將單詞添加到IME中。詳情請參閱README.md。"
                }
            },
            "https://github.com/themoeway/jmdict-yomitan": {
                "sub_category": null,
                "repository_name": "jmdict-yomitan",
                "user_name": "themoeway",
                "description": "JMdict, JMnedict, KANJIDIC for Yomitan/Yomichan.",
                "multilingual_descriptions": {
                    "en": "JMdict, JMnedict, KANJIDIC for Yomitan/Yomichan.",
                    "ja": "Yomitan/YomichanのためのJMdict、JMnedict、KANJIDIC。",
                    "zh-hans": "Yomitan / Yomichan的JMdict，JMnedict，KANJIDIC。",
                    "zh-hant": "Yomitan/Yomichan的JMdict、JMnedict和KANJIDIC。"
                }
            },
            "https://github.com/stephenmk/yomichan-jlpt-vocab": {
                "sub_category": null,
                "repository_name": "yomichan-jlpt-vocab",
                "user_name": "stephenmk",
                "description": "JLPT level tags for words in Yomichan",
                "multilingual_descriptions": {
                    "en": "JLPT level tags for words in Yomichan",
                    "ja": "Yomichanの単語に対するJLPTレベルのタグ",
                    "zh-hans": "Yomichan中单词的JLPT级别标签",
                    "zh-hant": "Yomichan中單詞的JLPT級別標籤"
                }
            },
            "https://github.com/stephenmk/Jitendex": {
                "sub_category": null,
                "repository_name": "Jitendex",
                "user_name": "stephenmk",
                "description": "A free and openly licensed Japanese-to-English dictionary compatible with multiple dictionary clients",
                "multilingual_descriptions": {
                    "en": "A free and openly licensed Japanese-to-English dictionary compatible with multiple dictionary clients",
                    "ja": "複数の辞書クライアントと互換性のある、無料でオープンライセンスの日本語-英語辞書",
                    "zh-hans": "一个免费且开放许可的日英词典，可与多个词典客户端兼容。",
                    "zh-hant": "一個免費且開放授權的日英詞典，可與多個詞典客戶端兼容。"
                }
            },
            "https://github.com/obfusk/jiten": {
                "sub_category": null,
                "repository_name": "jiten",
                "user_name": "obfusk",
                "description": "japanese android/cli/web dictionary based on jmdict/kanjidic — 日本語　辞典　和英辞典　漢英字典　和独辞典　和蘭辞典",
                "multilingual_descriptions": {
                    "en": "japanese android/cli/web dictionary based on jmdict/kanjidic — 日本語　辞典　和英辞典　漢英字典　和独辞典　和蘭辞典",
                    "ja": "JMDict/Kanjidicに基づいた日本語のAndroid/CLI/Web辞書 — 日本語辞典、和英辞典、漢英字典、和独辞典、和蘭辞典",
                    "zh-hans": "基于jmdict/kanjidic的日本安卓/命令行/网络词典 — 日英词典、汉英字典、德英词典、荷英词典",
                    "zh-hant": "基於jmdict/kanjidic的日本Android/CLI/Web字典 - 日語辭典、和英辭典、漢英字典、和德辭典、和蘭辭典"
                }
            },
            "https://github.com/MarvNC/pixiv-yomitan": {
                "sub_category": null,
                "repository_name": "pixiv-yomitan",
                "user_name": "MarvNC",
                "description": "Pixiv Encyclopedia Dictionary for Yomitan",
                "multilingual_descriptions": {
                    "en": "Pixiv Encyclopedia Dictionary for Yomitan",
                    "ja": "ピクシブ百科事典読谷のため",
                    "zh-hans": "Pixiv百科全书关于与那城的词典",
                    "zh-hant": "Pixiv 百科全書對於讀谷村的詞典"
                }
            },
            "https://github.com/nanjakkun/uchinaaguchi_dict": {
                "sub_category": null,
                "repository_name": "uchinaaguchi_dict",
                "user_name": "nanjakkun",
                "description": "うちなーぐち辞典（沖縄語辞典）",
                "multilingual_descriptions": {
                    "en": "Uchinaaguchi Dictionary (Okinawan Language Dictionary)",
                    "ja": "うちなーぐち辞典（沖縄語辞典）",
                    "zh-hans": "乌恩辞典（冲绳语辞典）",
                    "zh-hant": "琉球語辭典（沖繩語辭典）"
                }
            },
            "https://github.com/marvnc/yomitan-dictionaries": {
                "sub_category": null,
                "repository_name": "yomitan-dictionaries",
                "user_name": "marvnc",
                "description": "Japanese and Chinese dictionaries for Yomitan.",
                "multilingual_descriptions": {
                    "en": "Japanese and Chinese dictionaries for Yomitan.",
                    "ja": "読谷村のための日本語と中国語の辞書。",
                    "zh-hans": "与读谷村的日语和中文词典。",
                    "zh-hant": "讀取：讀取日本和中文詞典對於讀取。"
                }
            },
            "https://github.com/kengo700/mouse_over_dictionary": {
                "sub_category": null,
                "repository_name": "mouse_over_dictionary",
                "user_name": "kengo700",
                "description": "マウスオーバーした単語を自動で読み取る汎用辞書ツール",
                "multilingual_descriptions": {
                    "en": "Generic dictionary tool that automatically reads the word you mouse over.",
                    "ja": "マウスオーバーした単語を自動で読み取る汎用辞書ツール",
                    "zh-hans": "将鼠标悬停在单词上自动读取的通用词典工具",
                    "zh-hant": "滑鼠懸停在單字上時，自動讀取的通用辭典工具"
                }
            },
            "https://github.com/skk-dict/jisyo": {
                "sub_category": null,
                "repository_name": "jisyo",
                "user_name": "skk-dict",
                "description": "かな漢字変換エンジン SKKのための新しい辞書形式",
                "multilingual_descriptions": {
                    "en": "New dictionary format for the kana-kanji conversion engine SKK",
                    "ja": "かな漢字変換エンジン SKKのための新しい辞書形式",
                    "zh-hans": "为SKK输入法的新词典格式",
                    "zh-hant": "為SKK的新辭典格式的假名漢字轉換引擎"
                }
            },
            "https://github.com/ymrl/skk-jisyo.emoji-ja": {
                "sub_category": null,
                "repository_name": "skk-jisyo.emoji-ja",
                "user_name": "ymrl",
                "description": "日本語の読みから Emoji に変換するための SKK 辞書 😂",
                "multilingual_descriptions": {
                    "en": "SKK dictionary for converting Japanese readings to Emoji 😂",
                    "ja": "日本語の読みから Emoji に変換するための SKK 辞書 😂",
                    "zh-hans": "将日语读音转换为 Emoji 的 SKK 字典 😂",
                    "zh-hant": "日本語的讀音轉換為 Emoji 的 SKK 字典 😂"
                }
            },
            "https://github.com/netsphere-labs/anthy": {
                "sub_category": null,
                "repository_name": "anthy",
                "user_name": "netsphere-labs",
                "description": "Anthy is a kana-kanji conversion engine for Japanese. It converts roma-ji to kana, and the kana text to a mixed kana and kanji.",
                "multilingual_descriptions": {
                    "en": "Anthy is a kana-kanji conversion engine for Japanese. It converts roma-ji to kana, and the kana text to a mixed kana and kanji.",
                    "ja": "アンシーは日本語のかな漢字変換エンジンです。ローマ字をかなに変換し、かなテキストをかなと漢字の混合テキストに変換します。",
                    "zh-hans": "Anthy是一个用于日语的假名-汉字转换引擎。它可以将罗马字转换为假名，然后将假名文本转换为混合假名和汉字。",
                    "zh-hant": "Anthy是一個日文的假名漢字轉換引擎。它將羅馬字轉換為假名，並將假名文本轉換為混合假名和漢字。"
                }
            },
            "https://github.com/konyu/aws_dic_for_google_ime": {
                "sub_category": null,
                "repository_name": "aws_dic_for_google_ime",
                "user_name": "konyu",
                "description": "AWSサービス名のGoogle日本語入力向けの辞書",
                "multilingual_descriptions": {
                    "en": "Dictionary for Google Japanese input for AWS service names",
                    "ja": "AWSサービス名のGoogle日本語入力向けの辞書",
                    "zh-hans": "AWS服务名称的适用于Google日语输入的词典",
                    "zh-hant": "AWS服務名稱的Google日文輸入詞典"
                }
            },
            "https://github.com/tani/cl-skkserv": {
                "sub_category": null,
                "repository_name": "cl-skkserv",
                "user_name": "tani",
                "description": "Common LispによるSKK辞書サーバーとその拡張",
                "multilingual_descriptions": {
                    "en": "SKK dictionary server and its extensions using Common Lisp",
                    "ja": "Common LispによるSKK辞書サーバーとその拡張",
                    "zh-hans": "使用Common Lisp构建的SKK词典服务器及其扩展",
                    "zh-hant": "使用Common Lisp構建的SKK詞典伺服器及其擴展"
                }
            },
            "https://github.com/xorgy/anthy": {
                "sub_category": null,
                "repository_name": "anthy",
                "user_name": "xorgy",
                "description": "Anthy maintenance",
                "multilingual_descriptions": {
                    "en": "Anthy maintenance",
                    "ja": "アンシーのメンテナンス",
                    "zh-hans": "安蒂维护",
                    "zh-hant": "安西維護"
                }
            },
            "https://github.com/fujiwarat/anthy-unicode": {
                "sub_category": null,
                "repository_name": "anthy-unicode",
                "user_name": "fujiwarat",
                "description": "Another Anthy",
                "multilingual_descriptions": {
                    "en": "Anthy Unicode - Another Anthy",
                    "ja": "アンシーユニコード - アナザーアンシー",
                    "zh-hans": "安蒂Unicode - 另一个安蒂",
                    "zh-hant": "安西Unicode - 另一個安西"
                }
            },
            "https://github.com/ensan-hcl/azooKey": {
                "sub_category": null,
                "repository_name": "azooKey",
                "user_name": "ensan-hcl",
                "description": "azooKey: A Japanese Keyboard iOS Application Fully Developed in Swift",
                "multilingual_descriptions": {
                    "en": "azooKey: A Japanese Keyboard iOS Application Fully Developed in Swift",
                    "ja": "Input: azooKey: Swiftで完全に開発された日本語キーボードiOSアプリケーション\nOutput: azooKey：Swiftで完全に開発された日本語キーボードiOSアプリ",
                    "zh-hans": "azooKey：一款完全使用Swift开发的日本键盘iOS应用程序",
                    "zh-hant": "azooKey：一個完全使用Swift開發的日本鍵盤iOS應用程式"
                }
            },
            "https://github.com/ensan-hcl/azookey-desktop": {
                "sub_category": null,
                "repository_name": "azookey-desktop",
                "user_name": "ensan-hcl",
                "description": "Japanese Input Method \"azooKey\" for Desktop, supporting macOS",
                "multilingual_descriptions": {
                    "en": "Japanese Input Method azooKey for Desktop, supporting macOS",
                    "ja": "デスクトップ用の日本語入力メソッドazooKey、macOSをサポート",
                    "zh-hans": "日语输入法azooKey适用于桌面电脑，支持macOS。",
                    "zh-hant": "日文輸入法azooKey桌面版，支援macOS"
                }
            },
            "https://github.com/7ka-hiira/fcitx5-hazkey": {
                "sub_category": null,
                "repository_name": "fcitx5-hazkey",
                "user_name": "7ka-hiira",
                "description": "Japanese input method for fcitx5, powered by azooKey engine",
                "multilingual_descriptions": {
                    "en": "Japanese input method for fcitx5, powered by azooKey engine",
                    "ja": "fcitx5用の日本語入力メソッド、azooKeyエンジンによって提供されています。",
                    "zh-hans": "由azooKey引擎驱动的fcitx5日语输入法\n由azooKey引擎驱动的fcitx5日语输入法",
                    "zh-hant": "由azooKey引擎提供支援的fcitx5日文輸入法\n由azooKey引擎提供支援的fcitx5日文輸入法"
                }
            },
            "https://github.com/utuhiro78/mozcdic-ut-place-names": {
                "sub_category": null,
                "repository_name": "mozcdic-ut-place-names",
                "user_name": "utuhiro78",
                "description": "Mozc UT Place Name Dictionary is a dictionary converted from the Japan Post's ZIP code data for Mozc.",
                "multilingual_descriptions": {
                    "en": "Mozc UT Place Name Dictionary is a dictionary converted from the Japan Post's ZIP code data for Mozc.",
                    "ja": "Mozc UT 場所名辞書は、Mozc用に日本郵便の郵便番号データから変換された辞書です。",
                    "zh-hans": "Mozc UT地名词典是从日本邮政的邮政编码数据转换而来的词典，用于Mozc。",
                    "zh-hant": "Mozc UT 地名字典是從日本郵政的郵遞區號數據轉換而來的字典。"
                }
            },
            "https://github.com/ensan-hcl/azookeykanakanjiconverter": {
                "sub_category": null,
                "repository_name": "azookeykanakanjiconverter",
                "user_name": "ensan-hcl",
                "description": "Kana-Kanji Conversion Module written in Swift",
                "multilingual_descriptions": {
                    "en": "Kana-Kanji Conversion Module written in Swift",
                    "ja": "Swiftで書かれた仮名漢字変換モジュール",
                    "zh-hans": "用Swift编写的假名汉字转换模块",
                    "zh-hant": "使用Swift编写的假名-汉字转换模块"
                }
            },
            "https://github.com/ueno/libkkc": {
                "sub_category": null,
                "repository_name": "libkkc",
                "user_name": "ueno",
                "description": "Japanese Kana Kanji conversion input method library",
                "multilingual_descriptions": {
                    "en": "Japanese Kana Kanji conversion input method library",
                    "ja": "日本語仮名漢字変換入力方式ライブラリ",
                    "zh-hans": "日文假名汉字转换输入法库",
                    "zh-hant": "日文假名漢字轉換輸入法庫"
                }
            },
            "https://github.com/ueno/libskk": {
                "sub_category": null,
                "repository_name": "libskk",
                "user_name": "ueno",
                "description": "Japanese SKK input method library",
                "multilingual_descriptions": {
                    "en": "Japanese SKK input method library",
                    "ja": "日本語のSKK入力方式ライブラリ",
                    "zh-hans": "日本SKK输入法库",
                    "zh-hant": "日本 SKK 輸入法庫"
                }
            },
            "https://github.com/warihima/kanayomi-dict": {
                "sub_category": null,
                "repository_name": "kanayomi-dict",
                "user_name": "warihima",
                "description": "openjtalk形式のユーザー辞書",
                "multilingual_descriptions": {
                    "en": "User dictionary in openjtalk format",
                    "ja": "openjtalk形式のユーザー辞書",
                    "zh-hans": "openjtalk形式的用户词典",
                    "zh-hant": "openjtalk形式的用戶詞典"
                }
            },
            "https://github.com/cjkvi/cjkvi-dict": {
                "sub_category": null,
                "repository_name": "cjkvi-dict",
                "user_name": "cjkvi",
                "description": "漢字データベースの辞書関連データ",
                "multilingual_descriptions": {
                    "en": "Dictionary related data of the kanji database",
                    "ja": "漢字データベースの辞書関連データ",
                    "zh-hans": "汉字数据库的词典相关数据",
                    "zh-hant": "漢字資料庫的字典相關資料"
                }
            },
            "https://github.com/yocjyet/wlsp-classical": {
                "sub_category": null,
                "repository_name": "wlsp-classical",
                "user_name": "yocjyet",
                "description": "古典日本語の分類語彙表データ",
                "multilingual_descriptions": {
                    "en": "Classified vocabulary list data of classical Japanese",
                    "ja": "古典日本語の分類語彙表データ",
                    "zh-hans": "古典日本语的分类词汇表数据",
                    "zh-hant": "古典日本語的分類詞彙表數據"
                }
            },
            "https://github.com/marmooo/kanji-dict": {
                "sub_category": null,
                "repository_name": "kanji-dict",
                "user_name": "marmooo",
                "description": "漢字の書き順(筆順)・読み方・画数・部首・用例・成り立ちを調べるための漢字辞書です。Unicode 15.1 のすべての漢字 98,682字を収録しています。",
                "multilingual_descriptions": {
                    "en": "This is a kanji dictionary for looking up the stroke order, reading, number of strokes, radical, usage examples, and origin of kanji characters. It includes all 98,682 kanji characters in Unicode 15.1.",
                    "ja": "漢字の書き順(筆順)・読み方・画数・部首・用例・成り立ちを調べるための漢字辞書です。Unicode 15.1 のすべての漢字 98,682字を収録しています。",
                    "zh-hans": "这是一个用于查找汉字的笔顺、发音、画数、部首、用例和成立的汉字词典。收录了Unicode 15.1版本中的所有98,682个汉字。",
                    "zh-hant": "漢字的書寫順序(筆順)、讀音、畫數、部首、用例、起源等資訊的漢字詞典。收錄了Unicode 15.1版本中的所有漢字，共98682個字。"
                }
            },
            "https://github.com/mtripg6666tdr/Kaomoji_proj": {
                "sub_category": null,
                "repository_name": "Kaomoji_proj",
                "user_name": "mtripg6666tdr",
                "description": "(๑ ᴖ ᴑ ᴖ ๑)みょんかおもじ（旧Kaomoji_proj）はMicrosoft社の入力ソフト、Microsoft IME向けの顔文字の辞書を作成するプロジェクトです。",
                "multilingual_descriptions": {
                    "en": "(๑ ᴖ ᴑ ᴖ ๑) Myon Kaomoji (formerly Kaomoji_proj) is a project to create a dictionary of emoticons for Microsoft's input software, Microsoft IME.",
                    "ja": "(๑ ᴖ ᴑ ᴖ ๑)みょんかおもじ（旧Kaomoji_proj）はMicrosoft社の入力ソフト、Microsoft IME向けの顔文字の辞書を作成するプロジェクトです。",
                    "zh-hans": "(๑ ᴖ ᴑ ᴖ ๑)みょんかおもじ（旧Kaomoji_proj）是一个为Microsoft公司的输入软件Microsoft IME创建表情符号字典的项目。",
                    "zh-hant": "(๑ ᴖ ᴑ ᴖ ๑)みょんかおもじ（舊Kaomoji_proj）是一個為Microsoft公司的輸入軟件Microsoft IME製作表情符號詞典的項目。"
                }
            },
            "https://github.com/KazumaProject/kotlin-kana-kanji-converter": {
                "sub_category": null,
                "repository_name": "kotlin-kana-kanji-converter",
                "user_name": "KazumaProject",
                "description": "Kotlin かな漢字変換プログラム",
                "multilingual_descriptions": {
                    "en": "Kotlin Kana Kanji Conversion Program",
                    "ja": "Kotlin かな漢字変換プログラム",
                    "zh-hans": "Kotlin 平假名汉字转换程序",
                    "zh-hant": "Kotlin 假名漢字轉換程式"
                }
            },
            "https://github.com/chrisgrieser/alfred-japanese-dictionary": {
                "sub_category": null,
                "repository_name": "alfred-japanese-dictionary",
                "user_name": "chrisgrieser",
                "description": "Japanese-English Dictionary using jisho.org with audio, csv export of entries, and preview of dictionary sites.",
                "multilingual_descriptions": {
                    "en": "Japanese-English Dictionary using jisho.org with audio, csv export of entries, and preview of dictionary sites.",
                    "ja": "jisho.orgを使用した日本語-英語辞書、エントリーの音声付きCSVエクスポート、および辞書サイトのプレビュー。\njisho.orgを使用した日本語-英語辞書、エントリーの音声付きCSVエクスポート、および辞書サイトのプレビュー。",
                    "zh-hans": "使用jisho.org的日英词典，具有音频功能，可以导出条目的csv文件，并预览词典网站。",
                    "zh-hant": "使用jisho.org的日英詞典，具有音頻功能，可以導出CSV條目，並預覽詞典網站。"
                }
            },
            "https://github.com/tshatrov/ichiran": {
                "sub_category": null,
                "repository_name": "ichiran",
                "user_name": "tshatrov",
                "description": "Linguistic tools for texts in Japanese language",
                "multilingual_descriptions": {
                    "en": "Linguistic tools for texts in Japanese language",
                    "ja": "日本語のテキスト用言語ツール",
                    "zh-hans": "日语文本的语言工具",
                    "zh-hant": "日語文本的語言工具"
                }
            },
            "https://github.com/mojyack/mikan": {
                "sub_category": null,
                "repository_name": "mikan",
                "user_name": "mojyack",
                "description": "A Japanese input method.",
                "multilingual_descriptions": {
                    "en": "A Japanese input method.",
                    "ja": "日本語の入力方法。",
                    "zh-hans": "一个日本输入法。",
                    "zh-hant": "一種日本輸入法。"
                }
            },
            "https://github.com/sethclydesdale/colloquial-kansai-dictionary": {
                "sub_category": null,
                "repository_name": "colloquial-kansai-dictionary",
                "user_name": "sethclydesdale",
                "description": "A quick reference for the material taught in Colloquial Kansai Japanese.",
                "multilingual_descriptions": {
                    "en": "A quick reference for the material taught in Colloquial Kansai Japanese.",
                    "ja": "関西弁日本語の授業で教えられた教材の簡単な参考資料。",
                    "zh-hans": "关于关西方言日语教学材料的快速参考。",
                    "zh-hant": "關西方言日語教材的快速參考。"
                }
            },
            "https://github.com/hlorenzi/jisho-open": {
                "sub_category": null,
                "repository_name": "jisho-open",
                "user_name": "hlorenzi",
                "description": "Web frontend for the JMdict Japanese-English dictionary project, with study list support!",
                "multilingual_descriptions": {
                    "en": "Web frontend for the JMdict Japanese-English dictionary project, with study list support!",
                    "ja": "JMdict日本語英語辞書プロジェクトのWebフロントエンド、学習リストのサポート付き！\nJMdict日本語英語辞書プロジェクトのWebフロントエンド、学習リストのサポート付き！",
                    "zh-hans": "JMdict日语-英语词典项目的Web前端，支持学习列表！\nJMdict日语-英语词典项目的Web前端，支持学习列表！",
                    "zh-hant": "JMdict日英詞典項目的Web前端，支持學習列表！"
                }
            }
        },
        "Corpus": {
            "https://github.com/stockmarkteam/ner-wikipedia-dataset": {
                "sub_category": "Part-of-speech tagging / Named entity recognition",
                "repository_name": "ner-wikipedia-dataset",
                "user_name": "stockmarkteam",
                "description": "Wikipediaを用いた日本語の固有表現抽出データセット",
                "multilingual_descriptions": {
                    "en": "Dataset for extracting named entities in Japanese using Wikipedia",
                    "ja": "Wikipediaを用いた日本語の固有表現抽出データセット",
                    "zh-hans": "使用维基百科进行日语专有名词提取的数据集",
                    "zh-hant": "使用維基百科進行日語固有表現抽取的資料集"
                }
            },
            "https://github.com/Hironsan/IOB2Corpus": {
                "sub_category": "Part-of-speech tagging / Named entity recognition",
                "repository_name": "IOB2Corpus",
                "user_name": "Hironsan",
                "description": "Japanese IOB2 tagged corpus for Named Entity Recognition.",
                "multilingual_descriptions": {
                    "en": "Japanese IOB2 tagged corpus for Named Entity Recognition.",
                    "ja": "固有表現認識のための日本語IOB2タグ付きコーパス。",
                    "zh-hans": "用于命名实体识别的日语IOB2标记语料库。",
                    "zh-hant": "用於命名實體識別的日語IOB2標記語料庫。"
                }
            },
            "https://github.com/tmu-nlp/TwitterCorpus": {
                "sub_category": "Part-of-speech tagging / Named entity recognition",
                "repository_name": "TwitterCorpus",
                "user_name": "tmu-nlp",
                "description": "首都大日本語 Twitter コーパス",
                "multilingual_descriptions": {
                    "en": "Capital Japanese Twitter Corpus",
                    "ja": "首都大日本語 Twitter コーパス",
                    "zh-hans": "首都大日本语 Twitter 语料库",
                    "zh-hant": "首都大日本語 Twitter 語料庫"
                }
            },
            "https://github.com/megagonlabs/UD_Japanese-PUD": {
                "sub_category": "Part-of-speech tagging / Named entity recognition",
                "repository_name": "UD_Japanese-PUD",
                "user_name": "megagonlabs",
                "description": "Parallel Universal Dependencies.",
                "multilingual_descriptions": {
                    "en": "Parallel Universal Dependencies.",
                    "ja": "並列の普遍的な依存関係。",
                    "zh-hans": "并行通用依存关系。",
                    "zh-hant": "平行通用依存句法。"
                }
            },
            "https://github.com/megagonlabs/UD_Japanese-GSD": {
                "sub_category": "Part-of-speech tagging / Named entity recognition",
                "repository_name": "UD_Japanese-GSD",
                "user_name": "megagonlabs",
                "description": "Japanese data from the Google UDT 2.0.",
                "multilingual_descriptions": {
                    "en": "Japanese data from the Google UDT 2.0.",
                    "ja": "Google UDT 2.0からの日本語データ。",
                    "zh-hans": "谷歌UDT 2.0的日本数据。",
                    "zh-hant": "從Google UDT 2.0輸入的日本數據。"
                }
            },
            "https://github.com/ku-nlp/KWDLC": {
                "sub_category": "Part-of-speech tagging / Named entity recognition",
                "repository_name": "KWDLC",
                "user_name": "ku-nlp",
                "description": "Kyoto University Web Document Leads Corpus",
                "multilingual_descriptions": {
                    "en": "Kyoto University Web Document Leads Corpus",
                    "ja": "京都大学ウェブドキュメントリードコーパス",
                    "zh-hans": "京都大学网页文档引导语料库",
                    "zh-hant": "京都大學網頁文件引導語料庫"
                }
            },
            "https://github.com/ku-nlp/AnnotatedFKCCorpus": {
                "sub_category": "Part-of-speech tagging / Named entity recognition",
                "repository_name": "AnnotatedFKCCorpus",
                "user_name": "ku-nlp",
                "description": "Annotated Fuman Kaitori Center Corpus",
                "multilingual_descriptions": {
                    "en": "Annotated Fuman Kaitori Center Corpus",
                    "ja": "注釈付きの普門買取センターのコーパス",
                    "zh-hans": "注释版富满开拓中心语料库",
                    "zh-hant": "註釋版的富滿開取中心語料庫"
                }
            },
            "https://github.com/odashi/small_parallel_enja": {
                "sub_category": "Parallel corpus",
                "repository_name": "small_parallel_enja",
                "user_name": "odashi",
                "description": "50k English-Japanese Parallel Corpus for Machine Translation Benchmark.",
                "multilingual_descriptions": {
                    "en": "50k English-Japanese Parallel Corpus for Machine Translation Benchmark.",
                    "ja": "機械翻訳ベンチマーク用の50k英日並列コーパス。",
                    "zh-hans": "50k英日平行语料库，用于机器翻译基准测试。",
                    "zh-hant": "50k 英日平行語料庫，用於機器翻譯基準測試。"
                }
            },
            "https://github.com/zhang-jinyi/Web-Crawled-Corpus-for-Japanese-Chinese-NMT": {
                "sub_category": "Parallel corpus",
                "repository_name": "Web-Crawled-Corpus-for-Japanese-Chinese-NMT",
                "user_name": "zhang-jinyi",
                "description": "A Web Crawled Corpus for Japanese-Chinese NMT",
                "multilingual_descriptions": {
                    "en": "A Web Crawled Corpus for Japanese-Chinese NMT",
                    "ja": "日中NMTのためのWebクロールされたコーパス",
                    "zh-hans": "一个用于日中机器翻译的网络爬取语料库",
                    "zh-hant": "一個用於日中機器翻譯的網絡爬蟲語料庫"
                }
            },
            "https://github.com/shyyhs/CourseraParallelCorpusMining": {
                "sub_category": "Parallel corpus",
                "repository_name": "CourseraParallelCorpusMining",
                "user_name": "shyyhs",
                "description": "Coursera Corpus Mining and Multistage Fine-Tuning for Improving Lectures Translation",
                "multilingual_descriptions": {
                    "en": "Coursera Corpus Mining and Multistage Fine-Tuning for Improving Lectures Translation",
                    "ja": "Courseraのコーパスマイニングとマルチステージファインチューニングによる講義翻訳の改善",
                    "zh-hans": "Coursera语料库挖掘和多阶段微调，以提高讲座翻译质量。",
                    "zh-hant": "Coursera 課程挖掘和多階段微調，以改善講座翻譯"
                }
            },
            "https://github.com/rpryzant/JESC": {
                "sub_category": "Parallel corpus",
                "repository_name": "JESC",
                "user_name": "rpryzant",
                "description": "A large parallel corpus of English and Japanese",
                "multilingual_descriptions": {
                    "en": "A large parallel corpus of English and Japanese",
                    "ja": "英語と日本語の大規模な平行コーパス",
                    "zh-hans": "一个大型的英日平行语料库",
                    "zh-hant": "一個大型的英日平行語料庫"
                }
            },
            "https://github.com/tsuruoka-lab/AMI-Meeting-Parallel-Corpus": {
                "sub_category": "Parallel corpus",
                "repository_name": "AMI-Meeting-Parallel-Corpus",
                "user_name": "tsuruoka-lab",
                "description": "AMI Meeting Parallel Corpus",
                "multilingual_descriptions": {
                    "en": "AMI Meeting Parallel Corpus",
                    "ja": "AMIミーティング並列コーパス",
                    "zh-hans": "AMI会议平行语料库",
                    "zh-hant": "AMI會議平行語料庫"
                }
            },
            "https://github.com/DayuanJiang/giant_ja-en_parallel_corpus": {
                "sub_category": "Parallel corpus",
                "repository_name": "giant_ja-en_parallel_corpus",
                "user_name": "DayuanJiang",
                "description": "This directory includes a giant Japanese-English subtitle corpus. The raw data comes from the Stanford’s JESC project.",
                "multilingual_descriptions": {
                    "en": "This directory includes a giant Japanese-English subtitle corpus. The raw data comes from the Stanford’s JESC project.",
                    "ja": "このディレクトリには、巨大な日英字幕コーパスが含まれています。生データは、スタンフォード大学のJESCプロジェクトから取得されています。",
                    "zh-hans": "这个目录包含一个巨大的日英字幕语料库。原始数据来自斯坦福大学的JESC项目。",
                    "zh-hant": "這個目錄包含一個龐大的日英字幕語料庫。原始數據來自斯坦福大學的JESC項目。"
                }
            },
            "https://github.com/yusugomori/jesc_small": {
                "sub_category": "Parallel corpus",
                "repository_name": "jesc_small",
                "user_name": "yusugomori",
                "description": "Small Japanese-English Subtitle Corpus",
                "multilingual_descriptions": {
                    "en": "Small Japanese-English Subtitle Corpus",
                    "ja": "小さな日英字幕コーパス",
                    "zh-hans": "小型日英字幕语料库",
                    "zh-hant": "小型日英字幕語料庫"
                }
            },
            "https://github.com/marmooo/graded-enja-corpus": {
                "sub_category": "Parallel corpus",
                "repository_name": "graded-enja-corpus",
                "user_name": "marmooo",
                "description": "禁止用語や単語レベルを考慮した日英対訳コーパスです。",
                "multilingual_descriptions": {
                    "en": "This is a Japanese-English parallel corpus that takes into account prohibited language and word levels.",
                    "ja": "禁止用語や単語レベルを考慮した日英対訳コーパスです。",
                    "zh-hans": "这是一个考虑禁用词和单词级别的日英对照语料库。",
                    "zh-hant": "禁止用語或單詞級別考慮的日英對譯語料庫。"
                }
            },
            "https://github.com/dahlia/cjk-compsci-terms": {
                "sub_category": "Parallel corpus",
                "repository_name": "cjk-compsci-terms",
                "user_name": "dahlia",
                "description": "CJK computer science terms comparison / 中日韓電腦科學術語對照 / 日中韓のコンピュータ科学の用語対照 / 한·중·일 전산학 용어 대조",
                "multilingual_descriptions": {
                    "en": "Comparison of computer science terms in Chinese, Japanese, and Korean.",
                    "ja": "CJKコンピュータサイエンス用語比較 / 中日韓コンピュータサイエンス用語対照 / 日中韓コンピュータサイエンス用語比較 / 韓中日コンピュータサイエンス用語対照",
                    "zh-hans": "CJK计算机科学术语对照 / 中日韩电脑科学术语对照 / 日中韩计算机科学术语对照 / 韩中日计算机科学术语对照",
                    "zh-hant": "中日韓電腦科學術語對照 / 日中韓的電腦科學用語對照 / 韓中日電腦科學術語對照 / 한중일 컴퓨터 과학 용어 대조"
                }
            },
            "https://github.com/laboroai/Laboro-ParaCorpus": {
                "sub_category": "Parallel corpus",
                "repository_name": "Laboro-ParaCorpus",
                "user_name": "laboroai",
                "description": "Scripts for creating a Japanese-English parallel corpus and training NMT models",
                "multilingual_descriptions": {
                    "en": "Scripts for creating a Japanese-English parallel corpus and training NMT models",
                    "ja": "日英並列コーパスの作成スクリプトとNMTモデルのトレーニングに関するスクリプト",
                    "zh-hans": "用于创建日英平行语料库和训练NMT模型的脚本",
                    "zh-hant": "創建日英平行語料庫和訓練NMT模型的腳本"
                }
            },
            "https://github.com/Tzawa/google-vs-deepl-je": {
                "sub_category": "Parallel corpus",
                "repository_name": "google-vs-deepl-je",
                "user_name": "Tzawa",
                "description": "google-vs-deepl-je",
                "multilingual_descriptions": {
                    "en": "Google vs DeepL - Which one?",
                    "ja": "Google vs DeepL（日本語）",
                    "zh-hans": "谷歌 vs DeepL",
                    "zh-hant": "谷歌 vs DeepL JE"
                }
            },
            "https://github.com/ku-nlp/JMRD": {
                "sub_category": "Dialog corpus",
                "repository_name": "JMRD",
                "user_name": "ku-nlp",
                "description": "Japanese Movie Recommendation Dialogue dataset",
                "multilingual_descriptions": {
                    "en": "日本映画の推薦対話データセット",
                    "ja": "日本映画のおすすめ対話データセット",
                    "zh-hans": "日本电影推荐对话数据集",
                    "zh-hant": "日本電影推薦對話數據集"
                }
            },
            "https://github.com/1never/open2ch-dialogue-corpus": {
                "sub_category": "Dialog corpus",
                "repository_name": "open2ch-dialogue-corpus",
                "user_name": "1never",
                "description": "おーぷん2ちゃんねるをクロールして作成した対話コーパス",
                "multilingual_descriptions": {
                    "en": "A dialogue corpus created by crawling the 2channel open forum.",
                    "ja": "おーぷん2ちゃんねるをクロールして作成した対話コーパス",
                    "zh-hans": "使用爬虫程序从2ch论坛抓取并创建的对话语料库",
                    "zh-hant": "透過爬蟲從Open 2ch網站建立的對話語料庫"
                }
            },
            "https://github.com/tsuruoka-lab/BSD": {
                "sub_category": "Dialog corpus",
                "repository_name": "BSD",
                "user_name": "tsuruoka-lab",
                "description": "The Business Scene Dialogue corpus",
                "multilingual_descriptions": {
                    "en": "The Business Scene Dialogue corpus",
                    "ja": "ビジネスシーンの対話コーパス",
                    "zh-hans": "商业场景对话语料库",
                    "zh-hant": "商業場景對話語料庫"
                }
            },
            "https://github.com/megagonlabs/asdc": {
                "sub_category": "Dialog corpus",
                "repository_name": "asdc",
                "user_name": "megagonlabs",
                "description": "Accommodation Search Dialog Corpus (宿泊施設探索対話コーパス)",
                "multilingual_descriptions": {
                    "en": "Accommodation Search Dialog Corpus (宿泊施設探索対話コーパス)",
                    "ja": "宿泊施設探索対話コーパス",
                    "zh-hans": "住宿搜索对话语料库",
                    "zh-hant": "住宿搜索對話語料庫 (宿泊施設探索對話語料庫)"
                }
            },
            "https://github.com/MokkeMeguru/japanese-corpus": {
                "sub_category": "Dialog corpus",
                "repository_name": "japanese-corpus",
                "user_name": "MokkeMeguru",
                "description": "日本語の対話データ for seq2seq etc",
                "multilingual_descriptions": {
                    "en": "Japanese dialogue data for seq2seq, etc.",
                    "ja": "seq2seqなどに使用する日本語の対話データ",
                    "zh-hans": "用于seq2seq等的日语对话数据",
                    "zh-hant": "日語對話資料，適用於seq2seq等。"
                }
            },
            "https://github.com/cl-tohoku/BPersona-chat": {
                "sub_category": "Dialog corpus",
                "repository_name": "BPersona-chat",
                "user_name": "cl-tohoku",
                "description": "This repository contains the Japanese–English bilingual chat corpus BPersona-chat published in the paper Chat Translation Error Detection for Assisting Cross-lingual Communications at AACL-IJCNLP 2022's Workshop Eval4NLP 2022.",
                "multilingual_descriptions": {
                    "en": "This repository contains the Japanese–English bilingual chat corpus BPersona-chat published in the paper Chat Translation Error Detection for Assisting Cross-lingual Communications at AACL-IJCNLP 2022's Workshop Eval4NLP 2022.",
                    "ja": "このリポジトリには、AACL-IJCNLP 2022のWorkshop Eval4NLP 2022で発表された「Chat Translation Error Detection for Assisting Cross-lingual Communications」の論文で公開された日英バイリンガルチャットコーパスBPersna-chatが含まれています。",
                    "zh-hans": "这个仓库包含了日英双语聊天语料库BPersona-chat，该语料库已发表在AACL-IJCNLP 2022的Eval4NLP 2022研讨会上的论文《聊天翻译错误检测以协助跨语言交流》中。",
                    "zh-hant": "這個存儲庫包含了在AACL-IJCNLP 2022的Eval4NLP 2022研討會上發表的論文《Chat Translation Error Detection for Assisting Cross-lingual Communications》中所發布的日英雙語聊天語料庫BPersona-chat。"
                }
            },
            "https://github.com/jqk09a/japanese-daily-dialogue": {
                "sub_category": "Dialog corpus",
                "repository_name": "japanese-daily-dialogue",
                "user_name": "jqk09a",
                "description": "Japanese Daily Dialogue, or 日本語日常対話コーパス in Japanese, is a high-quality multi-turn dialogue dataset containing daily conversations on five topics: dailylife, school, travel, health, and entertainment.",
                "multilingual_descriptions": {
                    "en": "Japanese Daily Dialogue, or 日本語日常対話コーパス in Japanese, is a high-quality multi-turn dialogue dataset containing daily conversations on five topics: dailylife, school, travel, health, and entertainment.",
                    "ja": "「日本語日常対話コーパス」は、日常生活に関する会話を中心に、学校、旅行、健康、エンターテインメントの5つのトピックについての高品質なマルチターン対話データセットです。",
                    "zh-hans": "日本日常对话语料库，或日本语日常対話コーパス，是一个高质量的多轮对话数据集，包含五个主题的日常对话：日常生活，学校，旅行，健康和娱乐。",
                    "zh-hant": "日本語日常対話コーパス是一個高品質的多輪對話數據集，包含五個主題的日常對話：生活、學校、旅行、健康和娛樂。"
                }
            },
            "https://github.com/masanorihirano/llm-japanese-dataset": {
                "sub_category": "Dialog corpus",
                "repository_name": "llm-japanese-dataset",
                "user_name": "masanorihirano",
                "description": "LLM構築用の日本語チャットデータセット",
                "multilingual_descriptions": {
                    "en": "Japanese chat dataset for building LLM.",
                    "ja": "LLM構築用の日本語チャットデータセット",
                    "zh-hans": "LLM构建用的日语聊天数据集",
                    "zh-hant": "LLM構築用的日本語聊天資料集"
                }
            },
            "https://github.com/megagonlabs/jrte-corpus": {
                "sub_category": null,
                "repository_name": "jrte-corpus",
                "user_name": "megagonlabs",
                "description": "Japanese Realistic Textual Entailment Corpus (NLP 2020, LREC 2020)",
                "multilingual_descriptions": {
                    "en": "Japanese Realistic Textual Entailment Corpus (NLP 2020, LREC 2020)",
                    "ja": "日本の現実的なテキスト推論コーパス（NLP 2020、LREC 2020）",
                    "zh-hans": "日本现实文本蕴含语料库（NLP 2020，LREC 2020）",
                    "zh-hant": "日本現實文本蘊含語料庫（NLP 2020，LREC 2020）"
                }
            },
            "https://github.com/davidluzgouveia/kanji-data": {
                "sub_category": null,
                "repository_name": "kanji-data",
                "user_name": "davidluzgouveia",
                "description": "A JSON kanji dataset with updated JLPT levels and WaniKani information",
                "multilingual_descriptions": {
                    "en": "A JSON kanji dataset with updated JLPT levels and WaniKani information",
                    "ja": "更新されたJLPTレベルとWaniKani情報を含むJSON漢字データセット",
                    "zh-hans": "一个带有更新的JLPT级别和WaniKani信息的JSON汉字数据集。",
                    "zh-hant": "一個包含更新的JLPT級別和WaniKani信息的JSON漢字數據集。"
                }
            },
            "https://github.com/tmu-nlp/JapaneseWordSimilarityDataset": {
                "sub_category": null,
                "repository_name": "JapaneseWordSimilarityDataset",
                "user_name": "tmu-nlp",
                "description": "Japanese Word Similarity Dataset",
                "multilingual_descriptions": {
                    "en": "Japanese Word Similarity Dataset",
                    "ja": "日本語単語類似度データセット",
                    "zh-hans": "日语词语相似度数据集",
                    "zh-hant": "日本語詞語相似度資料集"
                }
            },
            "https://github.com/tmu-nlp/simple-jppdb": {
                "sub_category": null,
                "repository_name": "simple-jppdb",
                "user_name": "tmu-nlp",
                "description": "A paraphrase database for Japanese text simplification",
                "multilingual_descriptions": {
                    "en": "A paraphrase database for Japanese text simplification",
                    "ja": "日本語テキスト簡略化のための言い換えデータベース",
                    "zh-hans": "一个用于日语文本简化的释义数据库",
                    "zh-hant": "一個用於日文簡化的改述資料庫"
                }
            },
            "https://github.com/chakki-works/chABSA-dataset": {
                "sub_category": null,
                "repository_name": "chABSA-dataset",
                "user_name": "chakki-works",
                "description": "chakki's Aspect-Based Sentiment Analysis dataset",
                "multilingual_descriptions": {
                    "en": "chakki's Aspect-Based Sentiment Analysis dataset",
                    "ja": "チャッキのアスペクトベースの感情分析データセット",
                    "zh-hans": "查基的基于方面的情感分析数据集",
                    "zh-hant": "翻譯：chakki的基於方面的情感分析數據集"
                }
            },
            "https://github.com/SkelterLabsInc/JaQuAD": {
                "sub_category": null,
                "repository_name": "JaQuAD",
                "user_name": "SkelterLabsInc",
                "description": "JaQuAD: Japanese Question Answering Dataset for Machine Reading Comprehension (2022, Skelter Labs)",
                "multilingual_descriptions": {
                    "en": "JaQuAD: Japanese Question Answering Dataset for Machine Reading Comprehension (2022, Skelter Labs)",
                    "ja": "JaQuAD: 機械読解のための日本語質問応答データセット（2022年、Skelter Labs）",
                    "zh-hans": "JaQuAD：用于机器阅读理解的日语问答数据集（2022年，Skelter Labs）",
                    "zh-hant": "JaQuAD：日本機器閱讀理解問答資料集（2022年，Skelter Labs）"
                }
            },
            "https://github.com/verypluming/JaNLI": {
                "sub_category": null,
                "repository_name": "JaNLI",
                "user_name": "verypluming",
                "description": "Japanese Adversarial Natural Language Inference Dataset",
                "multilingual_descriptions": {
                    "en": "Japanese Adversarial Natural Language Inference Dataset",
                    "ja": "日本語の敵対的自然言語推論データセット",
                    "zh-hans": "日本对抗自然语言推理数据集",
                    "zh-hant": "日本對抗自然語言推論數據集"
                }
            },
            "https://github.com/megagonlabs/ebe-dataset": {
                "sub_category": null,
                "repository_name": "ebe-dataset",
                "user_name": "megagonlabs",
                "description": "Evidence-based Explanation Dataset (AACL-IJCNLP 2020)",
                "multilingual_descriptions": {
                    "en": "Evidence-based Explanation Dataset (AACL-IJCNLP 2020)",
                    "ja": "エビデンスに基づく説明データセット（AACL-IJCNLP 2020）",
                    "zh-hans": "基于证据的解释数据集（AACL-IJCNLP 2020）",
                    "zh-hant": "基於證據的解釋數據集（AACL-IJCNLP 2020）"
                }
            },
            "https://github.com/yagays/emoji-ja": {
                "sub_category": null,
                "repository_name": "emoji-ja",
                "user_name": "yagays",
                "description": "UNICODE絵文字の日本語読み/キーワード/分類辞書",
                "multilingual_descriptions": {
                    "en": "Japanese pronunciation/keywords/classification dictionary for UNICODE emojis.",
                    "ja": "UNICODE絵文字の日本語読み/キーワード/分類辞書",
                    "zh-hans": "UNICODE表情符号的日语读音/关键词/分类词典",
                    "zh-hant": "UNICODE繪文字的日本語讀音/關鍵字/分類詞典"
                }
            },
            "https://github.com/yagays/nayose-wikipedia-ja": {
                "sub_category": null,
                "repository_name": "nayose-wikipedia-ja",
                "user_name": "yagays",
                "description": "Wikipediaから作成した日本語名寄せデータセット",
                "multilingual_descriptions": {
                    "en": "Japanese name matching dataset created from Wikipedia.",
                    "ja": "Wikipediaから作成した日本語名寄せデータセット",
                    "zh-hans": "由维基百科创建的日语姓名对齐数据集",
                    "zh-hant": "從維基百科創建的日語名稱對齊數據集"
                }
            },
            "https://github.com/Hironsan/ja.text8": {
                "sub_category": null,
                "repository_name": "ja.text8",
                "user_name": "Hironsan",
                "description": "Japanese text8 corpus for word embedding.",
                "multilingual_descriptions": {
                    "en": "Japanese text8 corpus for word embedding.",
                    "ja": "単語埋め込みのための日本語text8コーパス。",
                    "zh-hans": "用于词嵌入的日语text8语料库。",
                    "zh-hant": "用於詞嵌入的日語text8語料庫。"
                }
            },
            "https://github.com/KodairaTomonori/ThreeLineSummaryDataset": {
                "sub_category": null,
                "repository_name": "ThreeLineSummaryDataset",
                "user_name": "KodairaTomonori",
                "description": "3行要約データセット",
                "multilingual_descriptions": {
                    "en": "3-line summary dataset",
                    "ja": "3行要約データセット",
                    "zh-hans": "3行摘要数据集",
                    "zh-hant": "3行摘要資料集"
                }
            },
            "https://github.com/hingston/japanese": {
                "sub_category": null,
                "repository_name": "japanese",
                "user_name": "hingston",
                "description": "This repo contains a list of the 44,998 most common Japanese words in order of frequency, as determined by the University of Leeds Corpus.",
                "multilingual_descriptions": {
                    "en": "This repo contains a list of the 44,998 most common Japanese words in order of frequency, as determined by the University of Leeds Corpus.",
                    "ja": "このリポジトリには、リーズ大学コーパスによって頻度順に決定された44,998の最も一般的な日本語単語のリストが含まれています。",
                    "zh-hans": "这个仓库包含了由利兹大学语料库确定的按频率排序的44,998个最常见的日语单词列表。",
                    "zh-hant": "這個存儲庫包含由利茲大學語料庫確定頻率排序的44,998個最常見的日語單詞列表。"
                }
            },
            "https://github.com/scriptin/kanji-frequency": {
                "sub_category": null,
                "repository_name": "kanji-frequency",
                "user_name": "scriptin",
                "description": "Kanji usage frequency data collected from various sources",
                "multilingual_descriptions": {
                    "en": "Kanji usage frequency data collected from various sources",
                    "ja": "様々な情報源から収集された漢字使用頻度データ",
                    "zh-hans": "从各种来源收集的汉字使用频率数据",
                    "zh-hant": "從各種來源收集的漢字使用頻率數據"
                }
            },
            "https://github.com/laboroai/TEDxJP-10K": {
                "sub_category": null,
                "repository_name": "TEDxJP-10K",
                "user_name": "laboroai",
                "description": "TEDxJP-10K ASR Evaluation Dataset",
                "multilingual_descriptions": {
                    "en": "TEDxJP-10K ASR Evaluation Dataset",
                    "ja": "TEDxJP-10K ASR 評価データセット",
                    "zh-hans": "TEDxJP-10K ASR 评估数据集",
                    "zh-hant": "TEDxJP-10K 語音辨識評估數據集"
                }
            },
            "https://github.com/chakki-works/CoARiJ": {
                "sub_category": null,
                "repository_name": "CoARiJ",
                "user_name": "chakki-works",
                "description": "Corpus of Annual Reports in Japan",
                "multilingual_descriptions": {
                    "en": "Corpus of Annual Reports in Japan",
                    "ja": "日本の年次報告書のコーパス",
                    "zh-hans": "日本年度报告语料库",
                    "zh-hant": "日本年報語料庫"
                }
            },
            "https://github.com/textlint-ja/technological-book-corpus-ja": {
                "sub_category": null,
                "repository_name": "technological-book-corpus-ja",
                "user_name": "textlint-ja",
                "description": "日本語で書かれた技術書を収集した生コーパス/ツール",
                "multilingual_descriptions": {
                    "en": "A raw corpus/tool that collects technical books written in Japanese.",
                    "ja": "日本語で書かれた技術書を収集した生コーパス/ツール",
                    "zh-hans": "收集了用日语编写的技术书籍的生语料库/工具",
                    "zh-hant": "收集了用日語撰寫的技術書籍的生語料庫/工具"
                }
            },
            "https://github.com/shirayu/ita-corpus-chuwa": {
                "sub_category": null,
                "repository_name": "ita-corpus-chuwa",
                "user_name": "shirayu",
                "description": "Chunked word annotation for ITA corpus",
                "multilingual_descriptions": {
                    "en": "Chunked word annotation for ITA corpus",
                    "ja": "ITAコーパスのチャンク化された単語注釈",
                    "zh-hans": "ITA语料库的分块词注释",
                    "zh-hant": "ITA語料庫的分塊詞註釋"
                }
            },
            "https://github.com/singletongue/wikipedia-utils": {
                "sub_category": null,
                "repository_name": "wikipedia-utils",
                "user_name": "singletongue",
                "description": "Utility scripts for preprocessing Wikipedia texts for NLP",
                "multilingual_descriptions": {
                    "en": "Utility scripts for preprocessing Wikipedia texts for NLP",
                    "ja": "NLPのためのWikipediaテキストの前処理のためのユーティリティスクリプト",
                    "zh-hans": "用于自然语言处理前处理维基百科文本的实用脚本",
                    "zh-hant": "用於自然語言處理的預處理維基百科文本的實用腳本"
                }
            },
            "https://github.com/MosasoM/inappropriate-words-ja": {
                "sub_category": null,
                "repository_name": "inappropriate-words-ja",
                "user_name": "MosasoM",
                "description": "日本語における不適切表現を収集します。自然言語処理の時のデータクリーニング用等に使えると思います。",
                "multilingual_descriptions": {
                    "en": "We will collect inappropriate expressions in Japanese. We believe it can be used for data cleaning in natural language processing.",
                    "ja": "日本語における不適切表現を収集します。自然言語処理の時のデータクリーニング用等に使えると思います。",
                    "zh-hans": "收集日语中不适当的表达方式。可用于自然语言处理时的数据清理等。",
                    "zh-hant": "收集日語中不適當的表達方式。可用於自然語言處理時的數據清理等。"
                }
            },
            "https://github.com/smartnews-smri/house-of-councillors": {
                "sub_category": null,
                "repository_name": "house-of-councillors",
                "user_name": "smartnews-smri",
                "description": "参議院の公式ウェブサイトから会派、議員、議案、質問主意書のデータを整理しました。",
                "multilingual_descriptions": {
                    "en": "We organized data on factions, members, bills, and interpellation requests from the official website of the House of Councillors.",
                    "ja": "参議院の公式ウェブサイトから会派、議員、議案、質問主意書のデータを整理しました。",
                    "zh-hans": "我们整理了参议院官方网站上的会派、议员、议案和质询意见书的数据。",
                    "zh-hant": "從參議院官方網站整理了會派、議員、議案、質問主意書的數據。"
                }
            },
            "https://github.com/smartnews-smri/house-of-representatives": {
                "sub_category": null,
                "repository_name": "house-of-representatives",
                "user_name": "smartnews-smri",
                "description": "国会議案データベース：衆議院",
                "multilingual_descriptions": {
                    "en": "National Diet Bill Database: House of Representatives",
                    "ja": "国会議案データベース：衆議院",
                    "zh-hans": "国会议案数据库：众议院",
                    "zh-hant": "國會議案資料庫：衆議院"
                }
            },
            "https://github.com/STAIR-Lab-CIT/STAIR-captions": {
                "sub_category": null,
                "repository_name": "STAIR-captions",
                "user_name": "STAIR-Lab-CIT",
                "description": "STAIR captions: large-scale Japanese image caption dataset",
                "multilingual_descriptions": {
                    "en": "STAIR captions: A Japanese image caption dataset on a large scale.",
                    "ja": "STAIRキャプション：大規模な日本語画像キャプションデータセット",
                    "zh-hans": "STAIR Captions：大规模日语图像描述数据集",
                    "zh-hant": "STAIR Captions：大規模日語圖像描述數據集"
                }
            },
            "https://github.com/ku-nlp/Winograd-Schema-Challenge-Ja": {
                "sub_category": null,
                "repository_name": "Winograd-Schema-Challenge-Ja",
                "user_name": "ku-nlp",
                "description": "Japanese Translation of Winograd Schema Challenge",
                "multilingual_descriptions": {
                    "en": "Japanese Translation of Winograd Schema Challenge",
                    "ja": "ウィノグラード・スキーマ・チャレンジの日本語翻訳",
                    "zh-hans": "Winograd模式挑战的日语翻译",
                    "zh-hant": "Winograd模式挑戰的日語翻譯"
                }
            },
            "https://github.com/ku-nlp/speechBSD": {
                "sub_category": null,
                "repository_name": "speechBSD",
                "user_name": "ku-nlp",
                "description": "An extension of the BSD corpus with audio and speaker attribute information",
                "multilingual_descriptions": {
                    "en": "An extension of the BSD corpus with audio and speaker attribute information",
                    "ja": "音声と話者属性情報を含むBSDコーパスの拡張版",
                    "zh-hans": "一个带有音频和说话人属性信息的BSD语料库扩展",
                    "zh-hant": "一個包含音訊和說話者屬性信息的BSD語料庫擴展版。"
                }
            },
            "https://github.com/mmorise/ita-corpus": {
                "sub_category": null,
                "repository_name": "ita-corpus",
                "user_name": "mmorise",
                "description": "ITAコーパスの文章リスト",
                "multilingual_descriptions": {
                    "en": "List of sentences in the ITA corpus",
                    "ja": "ITAコーパスの文章リスト",
                    "zh-hans": "ITA语料库的文章列表",
                    "zh-hant": "ITA語料庫的文章清單"
                }
            },
            "https://github.com/mmorise/rohan4600": {
                "sub_category": null,
                "repository_name": "rohan4600",
                "user_name": "mmorise",
                "description": "モーラバランス型日本語コーパス",
                "multilingual_descriptions": {
                    "en": "Mora balance Japanese corpus",
                    "ja": "モーラバランス型日本語コーパス",
                    "zh-hans": "摩拉平衡型日语语料库",
                    "zh-hant": "莫拉平衡型日本語語料庫"
                }
            },
            "https://github.com/whym/anlp-jp-history": {
                "sub_category": null,
                "repository_name": "anlp-jp-history",
                "user_name": "whym",
                "description": "言語処理学会年次大会講演の全リスト・機械可読版など",
                "multilingual_descriptions": {
                    "en": "A complete list, machine-readable version, etc. of the presentations at the annual meeting of the Association for Natural Language Processing.",
                    "ja": "言語処理学会年次大会講演の全リスト・機械可読版など",
                    "zh-hans": "语言处理学会年度大会演讲的完整列表和机器可读版本等。",
                    "zh-hant": "語言處理學會年度大會演講的完整列表和機器可讀版本等。"
                }
            },
            "https://github.com/cl-tohoku/keigo_transfer_task": {
                "sub_category": null,
                "repository_name": "keigo_transfer_task",
                "user_name": "cl-tohoku",
                "description": "敬語変換タスクにおける評価用データセット",
                "multilingual_descriptions": {
                    "en": "Evaluation dataset for honorific language conversion task.",
                    "ja": "敬語変換タスクにおける評価用データセット",
                    "zh-hans": "敬语转换任务的评估数据集",
                    "zh-hant": "敬語轉換任務中的評估數據集"
                }
            },
            "https://github.com/jamesohortle/loanwords_gairaigo": {
                "sub_category": null,
                "repository_name": "loanwords_gairaigo",
                "user_name": "jamesohortle",
                "description": "English loanwords in Japanese",
                "multilingual_descriptions": {
                    "en": "English loanwords in Japanese",
                    "ja": "日本語における英語の借用語",
                    "zh-hans": "日语中的英语借词",
                    "zh-hant": "日語中的英語借詞"
                }
            },
            "https://github.com/wikiwikification/jawikicorpus": {
                "sub_category": null,
                "repository_name": "jawikicorpus",
                "user_name": "wikiwikification",
                "description": "Japanese-Wikipedia Wikification Corpus",
                "multilingual_descriptions": {
                    "en": "Japanese-Wikipedia Wikification Corpus",
                    "ja": "日本語ウィキペディアのウィキフィケーションコーパス",
                    "zh-hans": "日语维基百科链接语料库",
                    "zh-hant": "日語維基百科鏈接化語料庫"
                }
            },
            "https://github.com/yuukimiyo/GeneralPolicySpeechOfPrimeMinisterOfJapan": {
                "sub_category": null,
                "repository_name": "GeneralPolicySpeechOfPrimeMinisterOfJapan",
                "user_name": "yuukimiyo",
                "description": "This is the corpus of Japanese Text that general policy speech of prime minister of Japan",
                "multilingual_descriptions": {
                    "en": "This is the corpus of Japanese Text that general policy speech of prime minister of Japan",
                    "ja": "これは日本の総理大臣の一般政策演説のコーパスです。",
                    "zh-hans": "这是日本首相一般政策演讲的语料库。",
                    "zh-hant": "這是日本總理一般政策演說的語料庫。"
                }
            },
            "https://github.com/ids-cv/wrime": {
                "sub_category": null,
                "repository_name": "wrime",
                "user_name": "ids-cv",
                "description": "WRIME: 主観と客観の感情分析データセット",
                "multilingual_descriptions": {
                    "en": "WRIME: Subjective and Objective Emotion Analysis Dataset.",
                    "ja": "WRIME: 主観と客観の感情分析データセット",
                    "zh-hans": "WRIME：主观和客观情感分析数据集",
                    "zh-hant": "WRIME：主觀與客觀情感分析資料集"
                }
            },
            "https://github.com/sarulab-speech/jtubespeech": {
                "sub_category": null,
                "repository_name": "jtubespeech",
                "user_name": "sarulab-speech",
                "description": "JTubeSpeech: Corpus of Japanese speech collected from YouTube",
                "multilingual_descriptions": {
                    "en": "JTubeSpeech: Corpus of Japanese speech collected from YouTube",
                    "ja": "JTubeSpeech：YouTubeから収集された日本語音声のコーパス",
                    "zh-hans": "JTubeSpeech：从YouTube收集的日语语音语料库",
                    "zh-hant": "JTubeSpeech：從YouTube收集的日語語音語料庫"
                }
            },
            "https://github.com/maeda6uiui-backup/WikipediaWordFrequencyList": {
                "sub_category": null,
                "repository_name": "WikipediaWordFrequencyList",
                "user_name": "maeda6uiui-backup",
                "description": "日本語Wikipediaで使用される頻出単語のリスト",
                "multilingual_descriptions": {
                    "en": "List of frequently used words in Japanese Wikipedia.",
                    "ja": "日本語Wikipediaで使用される頻出単語のリスト",
                    "zh-hans": "在日语维基百科中使用频繁的单词列表",
                    "zh-hant": "在日語Wikipedia中常用的單詞列表"
                }
            },
            "https://github.com/rindybell/kokkosho_data": {
                "sub_category": null,
                "repository_name": "kokkosho_data",
                "user_name": "rindybell",
                "description": "車両不具合情報に関するデータセット",
                "multilingual_descriptions": {
                    "en": "Dataset on vehicle malfunction information.",
                    "ja": "車両不具合情報に関するデータセット",
                    "zh-hans": "车辆故障信息数据集",
                    "zh-hant": "車輛故障資訊相關資料集"
                }
            },
            "https://github.com/ndl-lab/pdmocrdataset-part1": {
                "sub_category": null,
                "repository_name": "pdmocrdataset-part1",
                "user_name": "ndl-lab",
                "description": "デジタル化資料OCRテキスト化事業において作成されたOCR学習用データセット",
                "multilingual_descriptions": {
                    "en": "OCR learning dataset created for digital material OCR text conversion project.",
                    "ja": "デジタル化資料OCRテキスト化事業において作成されたOCR学習用データセット",
                    "zh-hans": "在数字化资料OCR文本化业务中创建的OCR学习用数据集",
                    "zh-hant": "在數位化資料OCR文字化業務中所創建的OCR學習用資料集。"
                }
            },
            "https://github.com/ndl-lab/huriganacorpus-ndlbib": {
                "sub_category": null,
                "repository_name": "huriganacorpus-ndlbib",
                "user_name": "ndl-lab",
                "description": "全国書誌データから作成した振り仮名のデータセット",
                "multilingual_descriptions": {
                    "en": "A dataset of furigana created from the National Bibliographic Data.",
                    "ja": "全国書誌データから作成した振り仮名のデータセット",
                    "zh-hans": "从全国书志数据创建的假名数据集",
                    "zh-hant": "從全國書目資料中創建的假名數據集"
                }
            },
            "https://github.com/Hiroshiba/jvs_hiho": {
                "sub_category": null,
                "repository_name": "jvs_hiho",
                "user_name": "Hiroshiba",
                "description": "JVS (Japanese versatile speech) コーパスの自作のラベル",
                "multilingual_descriptions": {
                    "en": "Self-made labels for the JVS (Japanese versatile speech) corpus.",
                    "ja": "JVS (Japanese versatile speech) コーパスの自作のラベル",
                    "zh-hans": "JVS（日本通用语音）语料库的自制标签",
                    "zh-hant": "JVS（Japanese versatile speech）語料庫的自製標籤"
                }
            },
            "https://github.com/po3rin/hirakanadic": {
                "sub_category": null,
                "repository_name": "hirakanadic",
                "user_name": "po3rin",
                "description": "Allows Sudachi to normalize from hiragana to katakana from any compound word list",
                "multilingual_descriptions": {
                    "en": "Allows Sudachi to normalize from hiragana to katakana from any compound word list",
                    "ja": "任意の複合語リストから、Sudachiでひらがなからカタカナへの正規化ができるようにします。",
                    "zh-hans": "允许Sudachi从任何复合词列表中将平假名标准化为片假名。",
                    "zh-hant": "允許Sudachi從任何複合詞列表中將平假名轉換為片假名。"
                }
            },
            "https://github.com/anilogia/animedb": {
                "sub_category": null,
                "repository_name": "animedb",
                "user_name": "anilogia",
                "description": "約100年に渡るアニメ作品リストデータベース",
                "multilingual_descriptions": {
                    "en": "Anime works list database spanning approximately 100 years.",
                    "ja": "約100年に渡るアニメ作品リストデータベース",
                    "zh-hans": "约100年的动画作品列表数据库",
                    "zh-hant": "約100年的動畫作品清單資料庫"
                }
            },
            "https://github.com/SaitoLab/security_words": {
                "sub_category": null,
                "repository_name": "security_words",
                "user_name": "SaitoLab",
                "description": "サイバーセキュリティに関連する公的な組織の日英対応",
                "multilingual_descriptions": {
                    "en": "Japanese-English correspondence of public organizations related to cybersecurity.",
                    "ja": "サイバーセキュリティに関連する公的な組織の日英対応",
                    "zh-hans": "与网络安全相关的公共机构的日英对应",
                    "zh-hant": "與網路安全相關的公共組織的日英對應"
                }
            },
            "https://github.com/sugi2000/Data-on-Japanese-Diet-Members": {
                "sub_category": null,
                "repository_name": "Data-on-Japanese-Diet-Members",
                "user_name": "sugi2000",
                "description": "日本の国会議員のデータ",
                "multilingual_descriptions": {
                    "en": "Data of Japanese parliament members.",
                    "ja": "日本の国会議員のデータ",
                    "zh-hans": "日本国会议员的数据",
                    "zh-hant": "日本國會議員的資料"
                }
            },
            "https://github.com/yuta1984/honkoku-data": {
                "sub_category": null,
                "repository_name": "honkoku-data",
                "user_name": "yuta1984",
                "description": "歴史資料の市民参加型翻刻プラットフォーム「みんなで翻刻」のテキストデータ置き場です。 / Transcription texts created on Minna de Honkoku (https://honkoku.org), a crowdsourced transcription platform for historical Japanese documents.",
                "multilingual_descriptions": {
                    "en": "Text data repository for Minna de Honkoku, a citizen-participation transcription platform for historical materials. / Transcription texts created on Minna de Honkoku (https://honkoku.org), a crowdsourced transcription platform for historical Japanese documents.",
                    "ja": "「みんなで翻刻」は、歴史資料の市民参加型翻刻プラットフォームであり、ここはそのテキストデータの置き場所です。https://honkoku.org で作成された歴史的な日本の文書の転写テキストです。",
                    "zh-hans": "这是历史资料的市民参与型翻刻平台“大家一起翻刻”的文本数据存放处。/ 在面向日本历史文献的众包翻刻平台“大家一起翻刻”（https://honkoku.org）上创建的翻刻文本。",
                    "zh-hant": "這是歷史資料的市民參與型翻刻平台「大家一起翻刻」的文本數據存放處。/ 這些文本是在「大家一起翻刻」（https://honkoku.org）這個為日本歷史文獻提供群眾翻刻的平台上創建的。"
                }
            },
            "https://github.com/Katsumata420/wikihow_japanese": {
                "sub_category": null,
                "repository_name": "wikihow_japanese",
                "user_name": "Katsumata420",
                "description": "wikiHow dataset (Japanese version)",
                "multilingual_descriptions": {
                    "en": "wikiHow dataset (Japanese version)",
                    "ja": "wikiHowデータセット（日本語版）",
                    "zh-hans": "wikiHow数据集（日语版）",
                    "zh-hant": "wikiHow數據集（日語版）"
                }
            },
            "https://github.com/mercari/engineer-vocabulary-list": {
                "sub_category": null,
                "repository_name": "engineer-vocabulary-list",
                "user_name": "mercari",
                "description": "Engineer Vocabulary List in Japanese/English",
                "multilingual_descriptions": {
                    "en": "Engineer Vocabulary List in Japanese/English",
                    "ja": "日本語/英語のエンジニア用語リスト",
                    "zh-hans": "日英工程师词汇表",
                    "zh-hant": "日英工程師詞彙表"
                }
            },
            "https://github.com/verypluming/JSICK": {
                "sub_category": null,
                "repository_name": "JSICK",
                "user_name": "verypluming",
                "description": "Japanese Sentences Involving Compositional Knowledge (JSICK) Dataset/JSICK-stress Test Set",
                "multilingual_descriptions": {
                    "en": "Japanese Sentences Involving Compositional Knowledge (JSICK) Dataset/JSICK-stress Test Set",
                    "ja": "日本語の構成的知識を含む文（JSICK）データセット/JSICKストレステストセット",
                    "zh-hans": "日语组合知识句子（JSICK）数据集/JSICK压力测试集",
                    "zh-hant": "涉及組合知識的日語句子（JSICK）資料集/JSICK壓力測試集"
                }
            },
            "https://github.com/JPCERTCC/phishurl-list": {
                "sub_category": null,
                "repository_name": "phishurl-list",
                "user_name": "JPCERTCC",
                "description": "Phishing URL dataset from JPCERT/CC",
                "multilingual_descriptions": {
                    "en": "Phishing URL dataset from JPCERT/CC",
                    "ja": "JPCERT/CCからのフィッシングURLデータセット",
                    "zh-hans": "来自JPCERT/CC的网络钓鱼URL数据集",
                    "zh-hant": "JPCERT/CC 的釣魚網址數據集"
                }
            },
            "https://github.com/shigashiyama/jcms": {
                "sub_category": null,
                "repository_name": "jcms",
                "user_name": "shigashiyama",
                "description": "A Japanese Corpus of Many Specialized Domains (JCMS)",
                "multilingual_descriptions": {
                    "en": "A Japanese Corpus of Many Specialized Domains (JCMS)",
                    "ja": "多数の専門分野をカバーした日本語コーパス（JCMS）",
                    "zh-hans": "一个涵盖多个专业领域的日语语料库（JCMS）",
                    "zh-hant": "一個涵蓋多個專業領域的日語語料庫 (JCMS)"
                }
            },
            "https://github.com/aozorahack/aozorabunko_text": {
                "sub_category": null,
                "repository_name": "aozorabunko_text",
                "user_name": "aozorahack",
                "description": "text-only archives of www.aozora.gr.jp",
                "multilingual_descriptions": {
                    "en": "text-only archives of www.aozora.gr.jp",
                    "ja": "www.aozora.gr.jpのテキストのみのアーカイブ",
                    "zh-hans": "www.aozora.gr.jp的纯文本档案",
                    "zh-hant": "www.aozora.gr.jp 的純文字檔案存檔"
                }
            },
            "https://github.com/astremo/friendly_JA-Corpus": {
                "sub_category": null,
                "repository_name": "friendly_JA-Corpus",
                "user_name": "astremo",
                "description": "friendly_JA is a parallel Japanese-to-Japanese corpus aimed at making Japanese easier by using the Latin/English derived katakana lexicon instead of the standard Sino-Japanese lexicon",
                "multilingual_descriptions": {
                    "en": "friendly_JA is a parallel Japanese-to-Japanese corpus aimed at making Japanese easier by using the Latin/English derived katakana lexicon instead of the standard Sino-Japanese lexicon",
                    "ja": "friendly_JAは、標準的な漢語語彙の代わりにラテン語/英語由来のカタカナ語彙を使用して日本語をより易しくすることを目的とした、日本語から日本語へのパラレルコーパスです。",
                    "zh-hans": "friendly_JA是一个平行的日语到日语语料库，旨在通过使用拉丁/英语衍生的片假名词汇表，而不是标准的汉日词汇表，使日语更容易理解。",
                    "zh-hant": "friendly_JA 是一個平行的日語對日語語料庫，旨在通過使用拉丁/英語衍生的片假名詞彙表，而不是標準的漢日詞彙表，使日語更容易。"
                }
            },
            "https://github.com/scriptin/topokanji": {
                "sub_category": null,
                "repository_name": "topokanji",
                "user_name": "scriptin",
                "description": "Topologically ordered lists of kanji for effective learning",
                "multilingual_descriptions": {
                    "en": "Topologically ordered lists of kanji for effective learning",
                    "ja": "効果的な学習のためのトポロジカルに並べられた漢字リスト",
                    "zh-hans": "拓扑排序的汉字列表，以实现有效学习。",
                    "zh-hant": "有效學習漢字的拓撲排序列表"
                }
            },
            "https://github.com/uribo/isbn4groups": {
                "sub_category": null,
                "repository_name": "isbn4groups",
                "user_name": "uribo",
                "description": "ISBN-13における日本語での出版物 (978-4-XXXXXXXXX) に関するデータ等",
                "multilingual_descriptions": {
                    "en": "Data related to Japanese publications in ISBN-13 format (978-4-XXXXXXXXX)",
                    "ja": "ISBN-13における日本語での出版物 (978-4-XXXXXXXXX) に関するデータ等",
                    "zh-hans": "与ISBN-13标准下的日语出版物（978-4-XXXXXXXXX）相关的数据等。",
                    "zh-hant": "關於ISBN-13中以日語出版的出版物（978-4-XXXXXXXXX）相關的數據等。"
                }
            },
            "https://github.com/komutan/NMeCab": {
                "sub_category": null,
                "repository_name": "NMeCab",
                "user_name": "komutan",
                "description": "NMeCab: About Japanese morphological analyzer on .NET",
                "multilingual_descriptions": {
                    "en": "NMeCab: About Japanese morphological analyzer on .NET",
                    "ja": "NMeCab: .NET上の日本語形態素解析器について",
                    "zh-hans": "NMeCab：关于.NET上的日语形态分析器",
                    "zh-hant": "NMeCab：關於在.NET上的日語形態分析器"
                }
            },
            "https://github.com/ndl-lab/ndlngramdata": {
                "sub_category": null,
                "repository_name": "ndlngramdata",
                "user_name": "ndl-lab",
                "description": "デジタル化資料から作成したOCRテキストデータのngram頻度統計情報のデータセット",
                "multilingual_descriptions": {
                    "en": "Dataset of n-gram frequency statistics information from OCR text data created from digitized materials.",
                    "ja": "デジタル化資料から作成したOCRテキストデータのngram頻度統計情報のデータセット",
                    "zh-hans": "由数字化资料创建的OCR文本数据的ngram频率统计信息数据集",
                    "zh-hant": "由數位化資料製作的OCR文字資料的ngram頻率統計資訊資料集。"
                }
            },
            "https://github.com/ndl-lab/ndlngramviewer_v2": {
                "sub_category": null,
                "repository_name": "ndlngramviewer_v2",
                "user_name": "ndl-lab",
                "description": "2023年1月にリニューアルしたNDL Ngram Viewerのソースコード等一式",
                "multilingual_descriptions": {
                    "en": "The complete set of source code for the NDL Ngram Viewer that was renewed in January 2023.",
                    "ja": "2023年1月にリニューアルしたNDL Ngram Viewerのソースコード等一式",
                    "zh-hans": "2023年1月更新的NDL Ngram Viewer源代码等套装",
                    "zh-hant": "2023年1月重新設計的NDL Ngram Viewer源代碼等一套"
                }
            },
            "https://github.com/japanese-law-analysis/data_set": {
                "sub_category": null,
                "repository_name": "data_set",
                "user_name": "japanese-law-analysis",
                "description": "法律・判例関係のデータセット",
                "multilingual_descriptions": {
                    "en": "Dataset related to laws and precedents.",
                    "ja": "法律・判例関係のデータセット",
                    "zh-hans": "法律·判例相关的数据集",
                    "zh-hant": "法律・判例相關的資料集"
                }
            },
            "https://github.com/shunk031/huggingface-datasets_wrime": {
                "sub_category": null,
                "repository_name": "huggingface-datasets_wrime",
                "user_name": "shunk031",
                "description": "WRIME for huggingface datasets",
                "multilingual_descriptions": {
                    "en": "WRIME for huggingface datasets",
                    "ja": "huggingfaceのデータセットのためのWRIME",
                    "zh-hans": "WRIME用于huggingface数据集。",
                    "zh-hant": "WRIME 的 HuggingFace 資料集"
                }
            },
            "https://github.com/ndl-lab/ndl-minhon-ocrdataset": {
                "sub_category": null,
                "repository_name": "ndl-minhon-ocrdataset",
                "user_name": "ndl-lab",
                "description": "NDL古典籍OCR学習用データセット（みんなで翻刻加工データ）",
                "multilingual_descriptions": {
                    "en": "NDL Classical Text OCR Learning Dataset (Collaborative Transcription and Processing Data)",
                    "ja": "NDL古典籍OCR学習用データセット（みんなで翻刻加工データ）",
                    "zh-hans": "NDL古典籍OCR学习用数据集（大家一起翻刻加工数据）",
                    "zh-hant": "NDL古典籍OCR學習用數據集（大家一起翻刻加工數據）"
                }
            },
            "https://github.com/AsPJT/PAX_SAPIENTICA": {
                "sub_category": null,
                "repository_name": "PAX_SAPIENTICA",
                "user_name": "AsPJT",
                "description": "GIS & Archaeological Simulator. 2023 in development.",
                "multilingual_descriptions": {
                    "en": "GIS & Archaeological Simulator. 2023 in development.",
                    "ja": "GISと考古学シミュレーター。2023年開発中。",
                    "zh-hans": "GIS和考古模拟器。2023年开发中。",
                    "zh-hant": "GIS和考古模擬器。2023年開發中。"
                }
            },
            "https://github.com/tasukuigarashi/j-liwc2015": {
                "sub_category": null,
                "repository_name": "j-liwc2015",
                "user_name": "tasukuigarashi",
                "description": "Japanese version of LIWC2015",
                "multilingual_descriptions": {
                    "en": "Japanese version of LIWC2015",
                    "ja": "LIWC2015の日本語版",
                    "zh-hans": "LIWC2015的日语版本",
                    "zh-hant": "LIWC2015的日文版本"
                }
            },
            "https://github.com/shunk031/huggingface-datasets_livedoor-news-corpus": {
                "sub_category": null,
                "repository_name": "huggingface-datasets_livedoor-news-corpus",
                "user_name": "shunk031",
                "description": "Japanese Livedoor news corpus for huggingface datasets",
                "multilingual_descriptions": {
                    "en": "Japanese Livedoor news corpus for huggingface datasets",
                    "ja": "huggingface datasets用の日本語Livedoorニュースコーパス",
                    "zh-hans": "日本Livedoor新闻语料库，用于huggingface数据集。",
                    "zh-hant": "日本Livedoor新聞語料庫，用於huggingface數據集。"
                }
            },
            "https://github.com/shunk031/huggingface-datasets_JGLUE": {
                "sub_category": null,
                "repository_name": "huggingface-datasets_JGLUE",
                "user_name": "shunk031",
                "description": "JGLUE: Japanese General Language Understanding Evaluation for huggingface datasets",
                "multilingual_descriptions": {
                    "en": "JGLUE: Japanese General Language Understanding Evaluation for huggingface datasets",
                    "ja": "JGLUE：huggingfaceデータセットのための日本語一般言語理解評価",
                    "zh-hans": "JGLUE：适用于huggingface数据集的日语通用语言理解评估",
                    "zh-hant": "JGLUE：用於huggingface數據集的日語通用語言理解評估"
                }
            },
            "https://github.com/Language-Media-Lab/commonsense-moral-ja": {
                "sub_category": null,
                "repository_name": "commonsense-moral-ja",
                "user_name": "Language-Media-Lab",
                "description": "JCommonsenseMorality is a dataset created through crowdsourcing that reflects the commonsense morality of Japanese annotators.",
                "multilingual_descriptions": {
                    "en": "JCommonsenseMorality is a dataset created through crowdsourcing that reflects the commonsense morality of Japanese annotators.",
                    "ja": "JCommonsenseMoralityは、日本の注釈者の常識的な道徳を反映したクラウドソーシングによって作成されたデータセットです。",
                    "zh-hans": "JCommonsenseMorality是通过众包创建的数据集，反映了日本标注者的常识道德。",
                    "zh-hant": "JCommonsenseMorality是一個通過眾包創建的數據集，反映了日本標註者的常識道德。"
                }
            },
            "https://github.com/nlp-waseda/comet-atomic-ja": {
                "sub_category": null,
                "repository_name": "comet-atomic-ja",
                "user_name": "nlp-waseda",
                "description": "COMET-ATOMIC ja",
                "multilingual_descriptions": {
                    "en": "COMET-ATOMIC ja",
                    "ja": "COMET-ATOMIC ja",
                    "zh-hans": "COMET-ATOMIC ja",
                    "zh-hant": "COMET-ATOMIC ja"
                }
            },
            "https://github.com/nlp-waseda/dcsg-ja": {
                "sub_category": null,
                "repository_name": "dcsg-ja",
                "user_name": "nlp-waseda",
                "description": "Dialogue Commonsense Graph in Japanese",
                "multilingual_descriptions": {
                    "en": "Dialogue Commonsense Graph in Japanese",
                    "ja": "日本語での対話の常識グラフ",
                    "zh-hans": "对话常识图（日语）",
                    "zh-hant": "日語對話常識圖表"
                }
            },
            "https://github.com/inspection-ai/japanese-toxic-dataset": {
                "sub_category": null,
                "repository_name": "japanese-toxic-dataset",
                "user_name": "inspection-ai",
                "description": "\"Proposal and Evaluation of Japanese Toxicity Schema\" provides a schema and dataset for toxicity in the Japanese language.",
                "multilingual_descriptions": {
                    "en": "\"Proposal and Evaluation of Japanese Toxicity Schema\" provides a schema and dataset for toxicity in the Japanese language.",
                    "ja": "「日本語毒性スキーマの提案と評価」は、日本語における毒性のスキーマとデータセットを提供します。",
                    "zh-hans": "《日本毒性模式的提案和评估》提供了一个日语毒性模式和数据集。",
                    "zh-hant": "《日語毒性模式的提案與評估》提供了日語毒性的模式和數據集。"
                }
            },
            "https://github.com/CyberAgentAILab/camera": {
                "sub_category": null,
                "repository_name": "camera",
                "user_name": "CyberAgentAILab",
                "description": "CAMERA (CyberAgent Multimodal Evaluation for Ad Text GeneRAtion) is the Japanese ad text generation dataset.",
                "multilingual_descriptions": {
                    "en": "CAMERA (CyberAgent Multimodal Evaluation for Ad Text GeneRAtion) is the Japanese ad text generation dataset.",
                    "ja": "CAMERA（CyberAgent Multimodal Evaluation for Ad Text GeneRAtion）は、日本の広告テキスト生成データセットです。",
                    "zh-hans": "CAMERA（CyberAgent多模态广告文本生成评估）是日本广告文本生成数据集。",
                    "zh-hant": "CAMERA（CyberAgent多模態評估廣告文本生成）是日本的廣告文本生成數據集。"
                }
            },
            "https://github.com/tanreinama/Japanese-Fakenews-Dataset": {
                "sub_category": null,
                "repository_name": "Japanese-Fakenews-Dataset",
                "user_name": "tanreinama",
                "description": "日本語フェイクニュースデータセット",
                "multilingual_descriptions": {
                    "en": "Japanese Fake News Dataset",
                    "ja": "日本語フェイクニュースデータセット",
                    "zh-hans": "日语假新闻数据集",
                    "zh-hant": "日語假新聞數據集"
                }
            },
            "https://github.com/aiishii/jpn_explainable_qa_dataset": {
                "sub_category": null,
                "repository_name": "jpn_explainable_qa_dataset",
                "user_name": "aiishii",
                "description": "jpn_explainable_qa_dataset",
                "multilingual_descriptions": {
                    "en": "jpn_explainable_qa_dataset",
                    "ja": "jpn_explainable_qa_dataset",
                    "zh-hans": "jpn可解释问答数据集",
                    "zh-hant": "jpn可解釋問答數據集"
                }
            },
            "https://github.com/nlp-titech/copa-japanese": {
                "sub_category": null,
                "repository_name": "copa-japanese",
                "user_name": "nlp-titech",
                "description": "COPA Dataset in Japanese",
                "multilingual_descriptions": {
                    "en": "COPA Dataset in Japanese",
                    "ja": "日本語のCOPAデータセット",
                    "zh-hans": "COPA数据集（日语）",
                    "zh-hant": "日本語的 COPA 資料集"
                }
            },
            "https://github.com/masayu-a/WLSP-familiarity": {
                "sub_category": null,
                "repository_name": "WLSP-familiarity",
                "user_name": "masayu-a",
                "description": "Word Familiarity Rate for 'Word List by Semantic Principles (WLSP)'",
                "multilingual_descriptions": {
                    "en": "Word Familiarity Rate for 'Word List by Semantic Principles (WLSP)'",
                    "ja": "「意味原理に基づく単語リスト（WLSP）」の単語親しみ度率",
                    "zh-hans": "“语义原则词汇表（WLSP）”中的单词熟悉度率",
                    "zh-hant": "「按語義原則分類的單詞列表（WLSP）」的詞語熟悉度率"
                }
            },
            "https://github.com/matbahasa/ProSub": {
                "sub_category": null,
                "repository_name": "ProSub",
                "user_name": "matbahasa",
                "description": "A cross-linguistic study of pronoun substitutes and address terms",
                "multilingual_descriptions": {
                    "en": "A cross-linguistic study of pronoun substitutes and address terms",
                    "ja": "代名詞の代替物と呼びかけの言葉に関する言語間比較研究",
                    "zh-hans": "代词替代和称谓词的跨语言研究",
                    "zh-hant": "代詞替代和稱呼詞的跨語言研究"
                }
            },
            "https://github.com/nuko-yokohama/ramendb": {
                "sub_category": null,
                "repository_name": "ramendb",
                "user_name": "nuko-yokohama",
                "description": "なんとかデータベース( https://supleks.jp/ )からのスクレイピングツールと収集データ",
                "multilingual_descriptions": {
                    "en": "Scraping tool and collected data from Nantoka Database (https://supleks.jp/).",
                    "ja": "なんとかデータベース( https://supleks.jp/ )からのスクレイピングツールと収集データ",
                    "zh-hans": "从某种数据库（https://supleks.jp/）进行的网络爬虫工具和收集的数据。",
                    "zh-hant": "從なんとか資料庫(https://supleks.jp/)的網頁爬蟲工具和收集的資料。"
                }
            },
            "https://github.com/shunk031/huggingface-datasets_CAMERA": {
                "sub_category": null,
                "repository_name": "huggingface-datasets_CAMERA",
                "user_name": "shunk031",
                "description": "CAMERA (CyberAgent Multimodal Evaluation for Ad Text GeneRAtion) for huggingface datasets",
                "multilingual_descriptions": {
                    "en": "CAMERA (CyberAgent Multimodal Evaluation for Ad Text GeneRAtion) for huggingface datasets",
                    "ja": "huggingfaceデータセットのためのCAMERA（CyberAgent Multimodal Evaluation for Ad Text GeneRAtion）",
                    "zh-hans": "针对huggingface数据集的CAMERA（CyberAgent多模态广告文本生成评估）",
                    "zh-hant": "用於huggingface數據集的CAMERA（CyberAgent多模態廣告文本生成評估）"
                }
            },
            "https://github.com/nlp-waseda/FactCheckSentenceNLI-FCSNLI-": {
                "sub_category": null,
                "repository_name": "FactCheckSentenceNLI-FCSNLI-",
                "user_name": "nlp-waseda",
                "description": "FactCheckSentenceNLIデータセット",
                "multilingual_descriptions": {
                    "en": "FactCheckSentenceNLI dataset",
                    "ja": "ファクトチェック文NLIデータセット",
                    "zh-hans": "事实核查句子NLI数据集",
                    "zh-hant": "事實檢查句子NLI數據集"
                }
            },
            "https://github.com/kunishou/databricks-dolly-15k-ja": {
                "sub_category": null,
                "repository_name": "databricks-dolly-15k-ja",
                "user_name": "kunishou",
                "description": "databricks/dolly-v2-12b の学習データに使用されたdatabricks-dolly-15k.jsonl を日本語に翻訳したデータセットになります。",
                "multilingual_descriptions": {
                    "en": "This is a dataset that has been translated into Japanese from the databricks-dolly-15k.jsonl file used for training in databricks/dolly-v2-12b.",
                    "ja": "databricks/dolly-v2-12b の学習データに使用されたdatabricks-dolly-15k.jsonl を日本語に翻訳したデータセットになります。",
                    "zh-hans": "这是一个将 databricks/dolly-v2-12b 的训练数据中使用的 databricks-dolly-15k.jsonl 翻译成日语的数据集。",
                    "zh-hant": "這是將用於databricks/dolly-v2-12b的學習數據中使用的databricks-dolly-15k.jsonl翻譯成日語的數據集。"
                }
            },
            "https://github.com/ku-nlp/EaST-MELD": {
                "sub_category": null,
                "repository_name": "EaST-MELD",
                "user_name": "ku-nlp",
                "description": "EaST-MELD is an English-Japanese dataset for emotion-aware speech translation based on MELD.",
                "multilingual_descriptions": {
                    "en": "EaST-MELD is an English-Japanese dataset for emotion-aware speech translation based on MELD.",
                    "ja": "EaST-MELDは、MELDに基づく感情認識音声翻訳のための英日データセットです。",
                    "zh-hans": "EaST-MELD是基于MELD的情感感知语音翻译的英日数据集。",
                    "zh-hant": "EaST-MELD是基於MELD的情感感知語音翻譯的英日數據集。"
                }
            },
            "https://github.com/elith-co-jp/meconaudio": {
                "sub_category": null,
                "repository_name": "meconaudio",
                "user_name": "elith-co-jp",
                "description": "Mecon Audio(Medical Conference Audio)は厚生労働省主催の先進医療会議の議事録の読み上げデータセットです。",
                "multilingual_descriptions": {
                    "en": "Mecon Audio (Medical Conference Audio) is a dataset of read-out minutes for advanced medical conferences sponsored by the Ministry of Health, Labour and Welfare.",
                    "ja": "Mecon Audio（メディカル・カンファレンス・オーディオ）は、厚生労働省が主催する先進医療会議の議事録を読み上げるためのデータセットです。",
                    "zh-hans": "Mecon Audio（医疗会议音频）是厚生劳动省主办的先进医疗会议记录的朗读数据集。",
                    "zh-hant": "Mecon Audio（醫學會議音頻）是厚生勞動省主辦的先進醫療會議議事錄的朗讀數據集。"
                }
            },
            "https://github.com/geolonia/japanese-addresses": {
                "sub_category": null,
                "repository_name": "japanese-addresses",
                "user_name": "geolonia",
                "description": "全国の町丁目レベル（277,191件）の住所データのオープンデータ",
                "multilingual_descriptions": {
                    "en": "Open data of address data at the town and block level nationwide (277,191 entries).",
                    "ja": "全国の町丁目レベル（277,191件）の住所データのオープンデータ",
                    "zh-hans": "全国镇街道级别（277,191条）的地址数据开放数据",
                    "zh-hant": "全國的町丁目級別（277,191項）住址數據的開放數據"
                }
            },
            "https://github.com/myokoym/aozorasearch": {
                "sub_category": null,
                "repository_name": "aozorasearch",
                "user_name": "myokoym",
                "description": "The full-text search system for Aozora Bunko by Groonga. 青空文庫全文検索ライブラリ兼Webアプリ。",
                "multilingual_descriptions": {
                    "en": "The full-text search system for Aozora Bunko by Groonga. A full-text search library and web app for Aozora Bunko.",
                    "ja": "Groongaによる青空文庫の全文検索システム。青空文庫全文検索ライブラリ兼Webアプリ。",
                    "zh-hans": "基于Groonga的青空文库全文搜索系统。青空文库全文检索库兼Web应用。",
                    "zh-hant": "Groonga的青空文庫全文檢索系統。青空文庫全文檢索庫兼Web應用程式。"
                }
            },
            "https://github.com/llm-jp/llm-jp-corpus": {
                "sub_category": null,
                "repository_name": "llm-jp-corpus",
                "user_name": "llm-jp",
                "description": "This repository contains scripts to reproduce the LLM-jp corpus.",
                "multilingual_descriptions": {
                    "en": "This repository contains scripts to reproduce the LLM-jp corpus.",
                    "ja": "このリポジトリには、LLM-jpコーパスを再現するためのスクリプトが含まれています。",
                    "zh-hans": "该存储库包含用于重现LLM-jp语料库的脚本。",
                    "zh-hant": "此存儲庫包含重現LLM-jp語料庫的腳本。"
                }
            },
            "https://github.com/shi3z/alpaca_ja": {
                "sub_category": null,
                "repository_name": "alpaca_ja",
                "user_name": "shi3z",
                "description": "alpacaデータセットを日本語化したものです",
                "multilingual_descriptions": {
                    "en": "This is a Japanese version of the alpaca dataset.",
                    "ja": "alpacaデータセットを日本語化したものです",
                    "zh-hans": "这是将alpaca数据集翻译成日语的内容。",
                    "zh-hant": "這是將alpaca數據集翻譯成日文的內容。"
                }
            },
            "https://github.com/megagonlabs/instruction_ja": {
                "sub_category": null,
                "repository_name": "instruction_ja",
                "user_name": "megagonlabs",
                "description": "Japanese instruction data (日本語指示データ)",
                "multilingual_descriptions": {
                    "en": "Japanese instruction data (日本語指示データ)",
                    "ja": "日本語指示データ",
                    "zh-hans": "日语指示数据",
                    "zh-hant": "日語指示數據"
                }
            },
            "https://github.com/siikamiika/japanese-family-names": {
                "sub_category": null,
                "repository_name": "japanese-family-names",
                "user_name": "siikamiika",
                "description": "Top 5000 Japanese family names, with readings, ordered by frequency.",
                "multilingual_descriptions": {
                    "en": "Top 5000 Japanese family names, with readings, ordered by frequency.",
                    "ja": "頻度順に並べられた読み付きの上位5000の日本の姓",
                    "zh-hans": "前5000个日本姓氏，附带读音，按频率排序。",
                    "zh-hant": "按頻率排序的前5000個日本姓氏，附帶讀音。"
                }
            },
            "https://github.com/kanjialive/kanji-data-media": {
                "sub_category": null,
                "repository_name": "kanji-data-media",
                "user_name": "kanjialive",
                "description": "Japanese language data on kanji, radicals, media files, fonts and related resources from Kanji alive",
                "multilingual_descriptions": {
                    "en": "Japanese language data on kanji, radicals, media files, fonts and related resources from Kanji alive",
                    "ja": "漢字アライブからの漢字、部首、メディアファイル、フォント、関連リソースに関する日本語データ",
                    "zh-hans": "来自Kanji alive的关于汉字、部首、媒体文件、字体和相关资源的日语语言数据",
                    "zh-hant": "來自Kanji alive的漢字、部首、媒體文件、字體和相關資源的日語語言數據"
                }
            },
            "https://github.com/reazon-research/reazonspeech": {
                "sub_category": null,
                "repository_name": "reazonspeech",
                "user_name": "reazon-research",
                "description": "Construct large-scale Japanese audio corpus at home",
                "multilingual_descriptions": {
                    "en": "Construct large-scale Japanese audio corpus at home",
                    "ja": "自宅で大規模な日本語音声コーパスを構築する",
                    "zh-hans": "在家构建大规模的日语音频语料库",
                    "zh-hant": "在家建立大規模的日語音訊語料庫"
                }
            },
            "https://github.com/ndl-lab/huriganacorpus-aozora": {
                "sub_category": null,
                "repository_name": "huriganacorpus-aozora",
                "user_name": "ndl-lab",
                "description": "青空文庫及びサピエの点字データから作成した振り仮名のデータセット",
                "multilingual_descriptions": {
                    "en": "Data set of furigana created from Aozora Bunko and Sapie's braille data.",
                    "ja": "青空文庫及びサピエの点字データから作成した振り仮名のデータセット",
                    "zh-hans": "从青空文库和Sapie的盲文数据创建的振假名（注音假名）数据集",
                    "zh-hant": "從青空文庫及Sapie的點字數據創建的振假名數據集"
                }
            },
            "https://github.com/koniwa/koniwa": {
                "sub_category": null,
                "repository_name": "koniwa",
                "user_name": "koniwa",
                "description": "An open collection of annotated voices in Japanese language",
                "multilingual_descriptions": {
                    "en": "An open collection of annotated voices in Japanese language",
                    "ja": "日本語のアノテーション付き声のオープンコレクション",
                    "zh-hans": "一个带注释的日语语音开放集合",
                    "zh-hant": "一個包含日語註釋聲音的開放收藏。"
                }
            },
            "https://github.com/nlp-waseda/JMMLU": {
                "sub_category": null,
                "repository_name": "JMMLU",
                "user_name": "nlp-waseda",
                "description": "日本語マルチタスク言語理解ベンチマーク Japanese Massive Multitask Language Understanding Benchmark",
                "multilingual_descriptions": {
                    "en": "Japanese Massive Multitask Language Understanding Benchmark",
                    "ja": "日本語マルチタスク言語理解ベンチマーク",
                    "zh-hans": "日语大规模多任务语言理解基准测试",
                    "zh-hant": "日語大規模多任務語言理解基準測試"
                }
            },
            "https://github.com/ndl-lab/hurigana-speech-corpus-aozora": {
                "sub_category": null,
                "repository_name": "hurigana-speech-corpus-aozora",
                "user_name": "ndl-lab",
                "description": "青空文庫振り仮名注釈付き音声コーパスのデータセット",
                "multilingual_descriptions": {
                    "en": "Dataset of audio corpus with furigana annotations from Aozora Bunko",
                    "ja": "青空文庫振り仮名注釈付き音声コーパスのデータセット",
                    "zh-hans": "青空文库振假名标注语音语料库数据集",
                    "zh-hant": "青空文庫振假名標註語音語料庫數據集"
                }
            },
            "https://github.com/hotchpotch/jqara": {
                "sub_category": null,
                "repository_name": "jqara",
                "user_name": "hotchpotch",
                "description": "検索拡張(RAG)評価のための日本語Q&Aデータセット",
                "multilingual_descriptions": {
                    "en": "JQaRA: Japanese Question Answering with Retrieval Augmentation - Japanese Q&A dataset for evaluating retrieval augmentation (RAG)",
                    "ja": "JQaRA: 検索拡張（RAG）を活用した日本語質問応答データセット",
                    "zh-hans": "JQaRA：具有检索增强功能的日语问答系统 - 用于检索增强（RAG）评估的日语问答数据集",
                    "zh-hant": "JQaRA：具有檢索增強功能的日本問答系統 - 用於檢索增強(RAG)評估的日語問答資料集"
                }
            },
            "https://github.com/aiishii/jemhopqa": {
                "sub_category": null,
                "repository_name": "jemhopqa",
                "user_name": "aiishii",
                "description": "JEMHopQA (Japanese Explainable Multi-hop Question Answering) is a Japanese multi-hop QA dataset that can evaluate internal reasoning.",
                "multilingual_descriptions": {
                    "en": "JEMHopQA (Japanese Explainable Multi-hop Question Answering) is a Japanese multi-hop QA dataset that can evaluate internal reasoning.",
                    "ja": "JEMHopQA（Japanese Explainable Multi-hop Question Answering）は、内部推論を評価できる日本語のマルチホップQAデータセットです。",
                    "zh-hans": "JEMHopQA（日本可解释的多跳问题回答）是一个日本多跳QA数据集，可以评估内部推理。",
                    "zh-hant": "JEMHopQA（日語可解釋多跳問答）是一個可以評估內部推理的日語多跳問答數據集。"
                }
            },
            "https://github.com/youmima/jacred": {
                "sub_category": null,
                "repository_name": "jacred",
                "user_name": "youmima",
                "description": "Repository for Japanese Document-level Relation Extraction Dataset (plan to be released in March).",
                "multilingual_descriptions": {
                    "en": "Repository for Japanese Document-level Relation Extraction Dataset (plan to be released in March).",
                    "ja": "日本語文書レベルの関係抽出データセットのリポジトリ（3月にリリース予定）",
                    "zh-hans": "日文文档级关系抽取数据集存储库（计划于三月发布）。",
                    "zh-hant": "用於日文文件級關係提取數據集的存儲庫（計劃在三月份發布）。"
                }
            },
            "https://github.com/naist-nlp/jades": {
                "sub_category": null,
                "repository_name": "jades",
                "user_name": "naist-nlp",
                "description": "JADES is a dataset for text simplification in Japanese, described in \"JADES: New Text Simplification Dataset in Japanese Targeted at Non-Native Speakers\" (the paper will be available soon).",
                "multilingual_descriptions": {
                    "en": "JADES is a dataset for text simplification in Japanese, described in 'JADES: New Text Simplification Dataset in Japanese Targeted at Non-Native Speakers' (the paper will be available soon).",
                    "ja": "JADESは、日本語のテキスト簡素化のためのデータセットであり、『JADES: New Text Simplification Dataset in Japanese Targeted at Non-Native Speakers』で説明されています（論文は近日中に公開されます）。",
                    "zh-hans": "JADES是一个用于日语文本简化的数据集，详细描述在《JADES: 面向非母语者的日语新文本简化数据集》（论文即将发布）。",
                    "zh-hant": "JADES是一個針對非母語使用者的日文文本簡化數據集，詳細介紹在《JADES:針對非母語使用者的日文新文本簡化數據集》（論文即將發表）。"
                }
            },
            "https://github.com/kunishou/do-not-answer-ja": {
                "sub_category": null,
                "repository_name": "do-not-answer-ja",
                "user_name": "kunishou",
                "description": "2023年8月にメルボルン大学から公開された安全性評価データセット『Do-Not-Answer』を日本語LLMの評価においても使用できるように日本語に自動翻訳し、さらに日本文化も考慮して修正したデータセット。",
                "multilingual_descriptions": {
                    "en": "A safety evaluation dataset \"Do-Not-Answer\" released by the University of Melbourne in August 2023 has been automatically translated into Japanese for use in the evaluation of Japanese LLM, and further modified to take into account Japanese culture.",
                    "ja": "2023年8月にメルボルン大学から公開された安全性評価データセット『Do-Not-Answer』を日本語LLMの評価においても使用できるように日本語に自動翻訳し、さらに日本文化も考慮して修正したデータセット。",
                    "zh-hans": "2023年8月，墨尔本大学发布了安全性评估数据集“Do-Not-Answer”，现在已经将其自动翻译成日语，以便用于评估日语LLM，并根据日本文化进行了修正的数据集。",
                    "zh-hant": "2023年8月，墨爾本大學公開了安全性評估數據集『Do-Not-Answer』，該數據集已經被自動翻譯成日語，並且考慮了日本文化進行了修正，以便在日語LLM評估中使用。"
                }
            },
            "https://github.com/kunishou/oasst1-89k-ja": {
                "sub_category": null,
                "repository_name": "oasst1-89k-ja",
                "user_name": "kunishou",
                "description": "OpenAssistant のオープンソースデータ OASST1 を日本語に翻訳したデータセットになります。",
                "multilingual_descriptions": {
                    "en": "This is a dataset that translates OpenAssistant's open source data OASST1 into Japanese.",
                    "ja": "OpenAssistant のオープンソースデータ OASST1 を日本語に翻訳したデータセットになります。",
                    "zh-hans": "OpenAssistant的开源数据OASST1已被翻译成日语的数据集。",
                    "zh-hant": "OpenAssistant 的開源數據 OASST1 已經被翻譯成日文的數據集。"
                }
            },
            "https://github.com/hotchpotch/jacwir": {
                "sub_category": null,
                "repository_name": "jacwir",
                "user_name": "hotchpotch",
                "description": "日本語情報検索評価のための小規模でカジュアルなWebタイトルと概要のデータセット",
                "multilingual_descriptions": {
                    "en": "JaCWIR: Japanese Casual Web IR Small-scale and casual web title and abstract dataset for Japanese information retrieval evaluation.",
                    "ja": "JaCWIR: Japanese Casual Web IR  日本語情報検索評価のための小規模でカジュアルなWebタイトルと概要のデータセット",
                    "zh-hans": "JaCWIR：日本休闲网络信息检索  用于评估日语信息检索的小型休闲Web标题和摘要数据集",
                    "zh-hant": "JaCWIR：日語休閒網路資訊檢索（Japanese Casual Web IR） 用於日語資訊檢索評估的小型休閒Web標題和摘要資料集"
                }
            },
            "https://github.com/laoshubaby/japanese-technical-dict": {
                "sub_category": null,
                "repository_name": "japanese-technical-dict",
                "user_name": "laoshubaby",
                "description": "日本語学習者のための科学技術業界でよく使われる片仮名と元の単語対照表",
                "multilingual_descriptions": {
                    "en": "Comparison table of commonly used katakana and original words in the science and technology industry for Japanese language learners.",
                    "ja": "日本語学習者のための科学技術業界でよく使われる片仮名と元の単語対照表",
                    "zh-hans": "面向日语学习者的科学技术行业常用片假名与原词对照表",
                    "zh-hant": "日本語學習者的科學技術業界常用片假名與原始單字對照表"
                }
            },
            "https://github.com/cl-tohoku/j-unimorph": {
                "sub_category": null,
                "repository_name": "j-unimorph",
                "user_name": "cl-tohoku",
                "description": "Dataset of UniMorph in Japanese",
                "multilingual_descriptions": {
                    "en": "Dataset of UniMorph in Japanese",
                    "ja": "日本語のUniMorphデータセット",
                    "zh-hans": "日语UniMorph数据集",
                    "zh-hant": "UniMorph的日文數據集"
                }
            },
            "https://github.com/riken-grp/GazeVQA": {
                "sub_category": null,
                "repository_name": "GazeVQA",
                "user_name": "riken-grp",
                "description": "Dataset for the LREC-COLING 2024 paper \"A Gaze-grounded Visual Question Answering Dataset for Clarifying Ambiguous Japanese Questions\"",
                "multilingual_descriptions": {
                    "en": "Dataset for the LREC-COLING 2024 paper A Gaze-grounded Visual Question Answering Dataset for Clarifying Ambiguous Japanese Questions",
                    "ja": "LREC-COLING 2024論文「曖昧な日本語質問を明確にするための視線に基づく視覚的質問応答データセット」のデータセット",
                    "zh-hans": "LREC-COLING 2024 论文《一个注视引导的视觉问答数据集，用于澄清模糊的日语问题》的数据集",
                    "zh-hant": "LREC-COLING 2024論文的數據集《針對澄清日語問題的凝視導向視覺問答數據集》"
                }
            },
            "https://github.com/riken-grp/J-CRe3": {
                "sub_category": null,
                "repository_name": "J-CRe3",
                "user_name": "riken-grp",
                "description": "Code for J-CRe3 experiments (Ueda et al., LREC-COLING, 2024)",
                "multilingual_descriptions": {
                    "en": "Code for J-CRe3 experiments (Ueda et al., LREC-COLING, 2024)",
                    "ja": "J-CRe3実験のコード（上田ら、LREC-COLING、2024）",
                    "zh-hans": "J-CRe3实验代码（上田等人，LREC-COLING，2024）",
                    "zh-hant": "J-CRe3 實驗代碼（上田等人，LREC-COLING，2024）"
                }
            },
            "https://github.com/sociocom/jmed-llm": {
                "sub_category": null,
                "repository_name": "jmed-llm",
                "user_name": "sociocom",
                "description": "JMED-LLM: Japanese Medical Evaluation Dataset for Large Language Models",
                "multilingual_descriptions": {
                    "en": "JMED-LLM: Japanese Medical Evaluation Dataset for Large Language Models",
                    "ja": "JMED-LLM: 大規模言語モデル向けの日本医学評価データセット",
                    "zh-hans": "JMED-LLM：用于大型语言模型的日本医学评估数据集",
                    "zh-hant": "JMED-LLM：大型語言模型的日本醫學評估數據集"
                }
            },
            "https://github.com/yamachig/lawtext": {
                "sub_category": null,
                "repository_name": "lawtext",
                "user_name": "yamachig",
                "description": "Plain text format for Japanese law",
                "multilingual_descriptions": {
                    "en": "Plain text format for Japanese law",
                    "ja": "日本の法律のプレーンテキスト形式",
                    "zh-hans": "日本法律的纯文本格式",
                    "zh-hant": "日本法律的純文本格式"
                }
            },
            "https://github.com/ndl-lab/pdmocrdataset-part2": {
                "sub_category": null,
                "repository_name": "pdmocrdataset-part2",
                "user_name": "ndl-lab",
                "description": "OCR処理プログラム研究開発事業において作成されたOCR学習用データセット",
                "multilingual_descriptions": {
                    "en": "OCR learning dataset created in OCR processing program research and development project.",
                    "ja": "OCR処理プログラム研究開発事業において作成されたOCR学習用データセット",
                    "zh-hans": "OCR处理程序研究开发项目中创建的OCR学习数据集",
                    "zh-hant": "OCR處理程式研究開發項目中所建立的OCR學習用數據集。"
                }
            },
            "https://github.com/nut-jnlp/japanesetopicwsd": {
                "sub_category": null,
                "repository_name": "japanesetopicwsd",
                "user_name": "nut-jnlp",
                "description": "話題に基づく語義曖昧性解消評価セット",
                "multilingual_descriptions": {
                    "en": "Evaluation set for topic-based word sense disambiguation",
                    "ja": "話題に基づく語義曖昧性解消評価セット",
                    "zh-hans": "基于话题的词义消歧评估集",
                    "zh-hant": "基於話題的詞義消歧評估集"
                }
            },
            "https://github.com/tomo-vv/temporalNLI_dataset": {
                "sub_category": null,
                "repository_name": "temporalNLI_dataset",
                "user_name": "tomo-vv",
                "description": "Jamp: Controlled Japanese Temporal Inference Dataset for Evaluating Generalization Capacity of Language Models",
                "multilingual_descriptions": {
                    "en": "Jamp: Controlled Japanese Temporal Inference Dataset for Evaluating Generalization Capacity of Language Models",
                    "ja": "Jamp: 言語モデルの汎化能力を評価するための統制された日本語時間推論データセット",
                    "zh-hans": "Jamp: 用于评估语言模型泛化能力的受控日语时间推理数据集",
                    "zh-hant": "Jamp：用於評估語言模型泛化能力的受控日語時間推理數據集"
                }
            },
            "https://github.com/DaisukeBekki/JSeM": {
                "sub_category": null,
                "repository_name": "JSeM",
                "user_name": "DaisukeBekki",
                "description": "Japanese semantic test suite (FraCaS counterpart and extensions)",
                "multilingual_descriptions": {
                    "en": "Japanese semantic test suite (FraCaS counterpart and extensions)",
                    "ja": "日本語意味テストスイート（FraCaSの対応および拡張）",
                    "zh-hans": "日语语义测试套件（FraCaS对应和扩展）",
                    "zh-hant": "日本語意義測試套件（FraCaS對應及擴展）"
                }
            },
            "https://github.com/mynlp/niilc-qa": {
                "sub_category": null,
                "repository_name": "niilc-qa",
                "user_name": "mynlp",
                "description": "NIILC QA data",
                "multilingual_descriptions": {
                    "en": "NIILC QA data",
                    "ja": "NIILC QAデータ",
                    "zh-hans": "NIILC QA 数据",
                    "zh-hant": "NIILC QA 數據"
                }
            },
            "https://github.com/nlp-waseda/chain-of-thought-ja-dataset": {
                "sub_category": null,
                "repository_name": "chain-of-thought-ja-dataset",
                "user_name": "nlp-waseda",
                "description": "Dataset of paper \"Verification of Chain-of-Thought Prompting in Japanese\"",
                "multilingual_descriptions": {
                    "en": "Dataset of paper Verification of Chain-of-Thought Prompting in Japanese",
                    "ja": "日本語での「Chain-of-Thought Prompting」の論文検証データセット",
                    "zh-hans": "论文《日语中思维链提示的验证》的数据集",
                    "zh-hant": "論文《日語中思維鏈提示的驗證》的數據集"
                }
            },
            "https://github.com/ku-nlp/WikipediaAnnotatedCorpus": {
                "sub_category": null,
                "repository_name": "WikipediaAnnotatedCorpus",
                "user_name": "ku-nlp",
                "description": "This is a Japanese text corpus that consists of Wikipedia articles with various linguistic annotations.",
                "multilingual_descriptions": {
                    "en": "This is a Japanese text corpus that consists of Wikipedia articles with various linguistic annotations.",
                    "ja": "これは、さまざまな言語注釈が付けられたWikipediaの記事からなる日本語テキストコーパスです。",
                    "zh-hans": "这是一个包含维基百科文章和各种语言注释的日语文本语料库。",
                    "zh-hant": "這是一個包含維基百科文章和各種語言標註的日文文本語料庫。"
                }
            },
            "https://github.com/kissge/elaws-history": {
                "sub_category": null,
                "repository_name": "elaws-history",
                "user_name": "kissge",
                "description": "e-Gov 法令検索で配布されている「全ての法令データ」を定期的にダウンロードし、アーカイブしています",
                "multilingual_descriptions": {
                    "en": "We regularly download and archive all legal data distributed through the e-Gov legal search.",
                    "ja": "e-Gov 法令検索で配布されている「全ての法令データ」を定期的にダウンロードし、アーカイブしています",
                    "zh-hans": "通过e-Gov法令搜索定期下载分发的“所有法令数据”，并进行归档。",
                    "zh-hant": "透過 e-Gov 法令檢索平台定期下載並存檔所有法令資料。"
                }
            },
            "https://github.com/Aratako/Japanese-RP-Bench": {
                "sub_category": null,
                "repository_name": "Japanese-RP-Bench",
                "user_name": "Aratako",
                "description": "Japanese-RP-BenchはLLMの日本語ロールプレイ能力を測定するためのベンチマークです。",
                "multilingual_descriptions": {
                    "en": "Japanese-RP-Bench is a benchmark for measuring LLM's Japanese role-playing ability.",
                    "ja": "Japanese-RP-BenchはLLMの日本語ロールプレイ能力を測定するためのベンチマークです。",
                    "zh-hans": "Japanese-RP-Bench是用于衡量LLM的日语角色扮演能力的基准。",
                    "zh-hant": "Japanese-RP-Bench是用來測量LLM的日語角色扮演能力的基準。"
                }
            }
        },
        "Tutorial": {
            "https://github.com/yuibi/spacy_tutorial": {
                "sub_category": null,
                "repository_name": "spacy_tutorial",
                "user_name": "yuibi",
                "description": "spaCy tutorial in English and Japanese. spacy-transformers, BERT, GiNZA.",
                "multilingual_descriptions": {
                    "en": "spaCy tutorial in English and Japanese. spacy-transformers, BERT, GiNZA.",
                    "ja": "spaCyチュートリアルの英語版と日本語版。spacy-transformers、BERT、GiNZA。",
                    "zh-hans": "spaCy教程（英文和日文）。spacy-transformers、BERT、GiNZA。",
                    "zh-hant": "spaCy英文和日文教程。spacy-transformers、BERT、GiNZA。"
                }
            },
            "https://github.com/icoxfog417/fastTextJapaneseTutorial": {
                "sub_category": null,
                "repository_name": "fastTextJapaneseTutorial",
                "user_name": "icoxfog417",
                "description": "Tutorial to train fastText with Japanese corpus",
                "multilingual_descriptions": {
                    "en": "Tutorial to train fastText with Japanese corpus",
                    "ja": "日本語コーパスを使用してfastTextをトレーニングするチュートリアル",
                    "zh-hans": "使用日语语料库训练fastText的教程",
                    "zh-hant": "使用日語語料庫訓練fastText的教程"
                }
            },
            "https://github.com/shunk031/allennlp-NER-ja": {
                "sub_category": null,
                "repository_name": "allennlp-NER-ja",
                "user_name": "shunk031",
                "description": "AllenNLP-NER-ja: AllenNLP による日本語を対象とした固有表現抽出",
                "multilingual_descriptions": {
                    "en": "AllenNLP-NER-ja: Named Entity Recognition for Japanese using AllenNLP",
                    "ja": "AllenNLP-NER-ja：AllenNLPによる日本語固有表現抽出",
                    "zh-hans": "AllenNLP-NER-ja：使用AllenNLP进行针对日语的命名实体识别。",
                    "zh-hant": "AllenNLP-NER-ja：使用AllenNLP進行針對日語的專有名詞識別。"
                }
            },
            "https://github.com/ymym3412/chariot-PyTorch-Japanese-text-classification": {
                "sub_category": null,
                "repository_name": "chariot-PyTorch-Japanese-text-classification",
                "user_name": "ymym3412",
                "description": "Experiment for Japanese Text classification using chariot and PyTorch",
                "multilingual_descriptions": {
                    "en": "Experiment for Japanese Text classification using chariot and PyTorch",
                    "ja": "ChariotとPyTorchを使用した日本語テキスト分類の実験",
                    "zh-hans": "使用 chariot 和 PyTorch 进行日语文本分类的实验",
                    "zh-hant": "使用 chariot 和 PyTorch 進行日文文本分類的實驗"
                }
            },
            "https://github.com/poyo46/ginza-examples": {
                "sub_category": null,
                "repository_name": "ginza-examples",
                "user_name": "poyo46",
                "description": "日本語NLPライブラリGiNZAのすゝめ",
                "multilingual_descriptions": {
                    "en": "Introduction to the Japanese NLP library GiNZA",
                    "ja": "日本語NLPライブラリGiNZAのすゝめ",
                    "zh-hans": "推荐日语NLP库GiNZA",
                    "zh-hant": "日本語NLP程式庫GiNZA的推薦"
                }
            },
            "https://github.com/nekoumei/DocumentClassificationUsingBERT-Japanese": {
                "sub_category": null,
                "repository_name": "DocumentClassificationUsingBERT-Japanese",
                "user_name": "nekoumei",
                "description": "DocumentClassificationUsingBERT-Japanese",
                "multilingual_descriptions": {
                    "en": "DocumentClassificationUsingBERT-Japanese",
                    "ja": "ドキュメント分類にBERTを使用する-日本語",
                    "zh-hans": "使用BERT进行文档分类-日语",
                    "zh-hant": "使用BERT進行文件分類-日文"
                }
            },
            "https://github.com/YutaroOgawa/BERT_Japanese_Google_Colaboratory": {
                "sub_category": null,
                "repository_name": "BERT_Japanese_Google_Colaboratory",
                "user_name": "YutaroOgawa",
                "description": "Google Colaboratoryで日本語のBERTを動かす方法です。",
                "multilingual_descriptions": {
                    "en": "How to run Japanese BERT on Google Colaboratory.",
                    "ja": "Google Colaboratoryで日本語のBERTを動かす方法です。",
                    "zh-hans": "这是在Google Colaboratory上运行日语BERT的方法。",
                    "zh-hant": "這是在 Google Colaboratory 上運行日本語 BERT 的方法。"
                }
            },
            "https://github.com/stockmarkteam/bert-book": {
                "sub_category": null,
                "repository_name": "bert-book",
                "user_name": "stockmarkteam",
                "description": "「BERTによる自然言語処理入門: Transformersを使った実践プログラミング」サポートページ",
                "multilingual_descriptions": {
                    "en": "\"Introduction to Natural Language Processing with BERT: Practical Programming using Transformers\" Support Page.",
                    "ja": "「BERTによる自然言語処理入門: Transformersを使った実践プログラミング」サポートページ",
                    "zh-hans": "“BERT自然语言处理入门：使用Transformers的实践编程”支持页面",
                    "zh-hant": "「BERT自然語言處理入門：使用Transformers的實踐編程」支援頁面"
                }
            },
            "https://github.com/mocobeta/janome-tutorial": {
                "sub_category": null,
                "repository_name": "janome-tutorial",
                "user_name": "mocobeta",
                "description": "Janome を使ったテキストマイニング入門チュートリアルです。",
                "multilingual_descriptions": {
                    "en": "This is an introductory tutorial on text mining using Janome.",
                    "ja": "Janome を使ったテキストマイニング入門チュートリアルです。",
                    "zh-hans": "这是一个使用Janome进行文本挖掘的入门教程。",
                    "zh-hant": "這是使用Janome進行文本探勘的入門教程。"
                }
            },
            "https://github.com/hnishi/handson-language-models": {
                "sub_category": null,
                "repository_name": "handson-language-models",
                "user_name": "hnishi",
                "description": "日本語の言語モデルのハンズオン資料です",
                "multilingual_descriptions": {
                    "en": "This is a hands-on material for a Japanese language model.",
                    "ja": "日本語の言語モデルのハンズオン資料です",
                    "zh-hans": "这是关于日语语言模型的实践资料。",
                    "zh-hant": "這是日語語言模型的實作指南資料。"
                }
            },
            "https://github.com/verypluming/JapaneseNLI": {
                "sub_category": null,
                "repository_name": "JapaneseNLI",
                "user_name": "verypluming",
                "description": "Google Colabで日本語テキスト推論を試す",
                "multilingual_descriptions": {
                    "en": "Trying Japanese text inference on Google Colab.",
                    "ja": "Google Colabで日本語テキスト推論を試す",
                    "zh-hans": "在Google Colab上尝试日语文本推理。",
                    "zh-hant": "嘗試在Google Colab進行日文文本推論。"
                }
            },
            "https://github.com/Gin5050/deep-learning-with-pytorch-ja": {
                "sub_category": null,
                "repository_name": "deep-learning-with-pytorch-ja",
                "user_name": "Gin5050",
                "description": "deep-learning-with-pytorchの日本語版repositoryです。",
                "multilingual_descriptions": {
                    "en": "This is the Japanese version of the deep-learning-with-pytorch repository.",
                    "ja": "deep-learning-with-pytorchの日本語版リポジトリです。",
                    "zh-hans": "这是deep-learning-with-pytorch的日文版存储库。",
                    "zh-hant": "這是 deep-learning-with-pytorch 的日文版 repository。"
                }
            },
            "https://github.com/python-nlp-book/python-nlp-book": {
                "sub_category": null,
                "repository_name": "python-nlp-book",
                "user_name": "python-nlp-book",
                "description": "ディープラーニングによる自然言語処理（共立出版）のサポートページです",
                "multilingual_descriptions": {
                    "en": "This is the support page for \"Natural Language Processing with Deep Learning\" (published by Kyoritsu Shuppan)",
                    "ja": "ディープラーニングによる自然言語処理（共立出版）のサポートページです",
                    "zh-hans": "这是《自然语言处理：基于深度学习》（共立出版社）的支持页面。",
                    "zh-hant": "透過深度學習的自然語言處理（共立出版）支援頁面。"
                }
            },
            "https://github.com/ghmagazine/llm-book": {
                "sub_category": null,
                "repository_name": "llm-book",
                "user_name": "ghmagazine",
                "description": "「大規模言語モデル入門」（技術評論社, 2023）のGitHubリポジトリ",
                "multilingual_descriptions": {
                    "en": "GitHub repository for \"Introduction to Large-scale Language Models\" (Gijutsu-Hyoronsha, 2023)",
                    "ja": "「大規模言語モデル入門」（技術評論社, 2023）のGitHubリポジトリ",
                    "zh-hans": "「大规模语言模型入门」（技术评论社，2023）的GitHub仓库",
                    "zh-hant": "「大規模言語模型入門」（技術評論社，2023）的GitHub存儲庫"
                }
            },
            "https://github.com/hiroshi-matsuda-rit/nlp2024-tutorial-3": {
                "sub_category": null,
                "repository_name": "nlp2024-tutorial-3",
                "user_name": "hiroshi-matsuda-rit",
                "description": "環境構築手順とソースコード",
                "multilingual_descriptions": {
                    "en": "NLP2024 Tutorial 3 Creating and Learning a Large-Scale Japanese Language Model - Environment Setup Procedure and Source Code",
                    "ja": "NLP2024 チュートリアル３ 作って学ぶ日本語大規模言語モデル - 環境構築手順とソースコード",
                    "zh-hans": "NLP2024 教程3 制作和学习日语大规模语言模型 - 环境搭建步骤和源代码",
                    "zh-hant": "NLP2024 教程三 創建並學習日語大規模語言模型 - 環境構建步驟與源代碼"
                }
            },
            "https://github.com/mpkato/japanese-ir-tutorial": {
                "sub_category": null,
                "repository_name": "japanese-ir-tutorial",
                "user_name": "mpkato",
                "description": "日本語情報検索チュートリアル",
                "multilingual_descriptions": {
                    "en": "Japanese Information Retrieval Tutorial",
                    "ja": "日本語情報検索チュートリアル",
                    "zh-hans": "日本语信息检索教程",
                    "zh-hant": "日本語資訊檢索教學"
                }
            },
            "https://github.com/mamorlis/nlpbook": {
                "sub_category": null,
                "repository_name": "nlpbook",
                "user_name": "mamorlis",
                "description": "「自然言語処理の教科書」サポートサイト",
                "multilingual_descriptions": {
                    "en": "\"Natural Language Processing Textbook\" Support Site",
                    "ja": "「自然言語処理の教科書」サポートサイト",
                    "zh-hans": "\"自然语言处理教科书\"支持网站",
                    "zh-hant": "「自然語言處理教科書」支援網站"
                }
            },
            "https://github.com/makenowjust/kantan-regex-book": {
                "sub_category": null,
                "repository_name": "kantan-regex-book",
                "user_name": "makenowjust",
                "description": "作って学ぶ正規表現エンジン",
                "multilingual_descriptions": {
                    "en": "Learn how regular expression engines work by building one",
                    "ja": "作って学ぶ正規表現エンジン",
                    "zh-hans": "制作并学习正则表达式引擎",
                    "zh-hant": "製作並學習正規表達式引擎"
                }
            },
            "https://github.com/hpprc/bert-classification-tutorial-2024": {
                "sub_category": null,
                "repository_name": "bert-classification-tutorial-2024",
                "user_name": "hpprc",
                "description": "【2024年版】BERTによるテキスト分類",
                "multilingual_descriptions": {
                    "en": "[2024 edition] Text classification with BERT",
                    "ja": "【2024年版】BERTによるテキスト分類",
                    "zh-hans": "【2024年版】基于BERT的文本分类",
                    "zh-hant": "【2024年版】BERT進行文本分類"
                }
            },
            "https://github.com/qianniu95/gemma2_2b_finetune_jp_tutorial/blob/main/Gemma2_2b_Japanese_finetuning_colab.ipynb": {
                "sub_category": null,
                "repository_name": "gemma2_2b_finetune_jp_tutorial",
                "user_name": "qianniu95",
                "description": "Fine-Tuning Google Gemma for Japanese Instructions",
                "multilingual_descriptions": {
                    "en": "Fine-Tuning Google Gemma for Japanese Instructions",
                    "ja": "日本語の指示に対応させるためのGoogle Gemmaのファインチューニング",
                    "zh-hans": "对Google Gemma进行日语指令的微调",
                    "zh-hant": "將Google Gemma微調為日文指令"
                }
            },
            "https://github.com/upura/nlp100v2020": {
                "sub_category": null,
                "repository_name": "nlp100v2020",
                "user_name": "upura",
                "description": "「言語処理100本ノック 2020」をPythonで解く",
                "multilingual_descriptions": {
                    "en": "Solving \"Language Processing 100 Knock 2020\" with Python",
                    "ja": "「言語処理100本ノック 2020」をPythonで解く",
                    "zh-hans": "用Python解决“自然语言处理100道题目2020”",
                    "zh-hant": "用Python解決「自然語言處理100道題目2020」"
                }
            }
        },
        "Research summary": {
            "https://github.com/himkt/awesome-bert-japanese": {
                "sub_category": null,
                "repository_name": "awesome-bert-japanese",
                "user_name": "himkt",
                "description": "A list of pre-trained BERT models for Japanese with word/subword tokenization + vocabulary construction algorithm information",
                "multilingual_descriptions": {
                    "en": "A list of pre-trained BERT models for Japanese with word/subword tokenization + vocabulary construction algorithm information",
                    "ja": "日本語の事前学習済みBERTモデルのリストと、単語/サブワードトークン化+語彙構築アルゴリズム情報。",
                    "zh-hans": "一个预训练的BERT模型列表，包括日语的单词/子词分词和词汇构建算法信息。",
                    "zh-hant": "一份預先訓練的BERT模型清單，包括日語的單詞/子詞分詞和詞彙構建算法信息。"
                }
            },
            "https://github.com/gotutiyan/GEC-Info-ja": {
                "sub_category": null,
                "repository_name": "GEC-Info-ja",
                "user_name": "gotutiyan",
                "description": "文法誤り訂正に関する日本語文献を収集・分類するためのリポジトリ",
                "multilingual_descriptions": {
                    "en": "Repository for collecting and categorizing Japanese literature on correcting grammar errors.",
                    "ja": "文法誤り訂正に関する日本語文献を収集・分類するためのリポジトリ",
                    "zh-hans": "收集和分类有关日语文法错误修正的文献的存储库。",
                    "zh-hant": "收集和分類文法錯誤訂正相關日語文獻的儲存庫"
                }
            },
            "https://github.com/ikegami-yukino/dataset-list": {
                "sub_category": null,
                "repository_name": "dataset-list",
                "user_name": "ikegami-yukino",
                "description": "lists of text corpus and more (mainly Japanese)",
                "multilingual_descriptions": {
                    "en": "lists of text corpus and more (mainly Japanese)",
                    "ja": "テキストコーパスなどのリスト（主に日本語）",
                    "zh-hans": "文本语料库列表和更多（主要是日语）",
                    "zh-hant": "文本語料庫列表及更多（主要為日語）"
                }
            },
            "https://github.com/Valkyrja3607/tuning_playbook_ja": {
                "sub_category": null,
                "repository_name": "tuning_playbook_ja",
                "user_name": "Valkyrja3607",
                "description": "ディープラーニングモデルの性能を体系的に最大化するためのプレイブック",
                "multilingual_descriptions": {
                    "en": "A playbook for systematically maximizing the performance of deep learning models.",
                    "ja": "ディープラーニングモデルの性能を体系的に最大化するためのプレイブック",
                    "zh-hans": "深度学习模型性能最大化的系统指南",
                    "zh-hant": "系統地最大化深度學習模型性能的策略手冊"
                }
            },
            "https://github.com/olety/japanese-pitch-accent-resources": {
                "sub_category": null,
                "repository_name": "japanese-pitch-accent-resources",
                "user_name": "olety",
                "description": "Trying to consolidate japanese phonetic, and in particular pitch accent resources into one list",
                "multilingual_descriptions": {
                    "en": "Trying to consolidate japanese phonetic, and in particular pitch accent resources into one list",
                    "ja": "日本語の音声、特にアクセントに関するリソースを一つのリストにまとめようとしています。",
                    "zh-hans": "尝试将日语音标，特别是声调资源整合成一个列表。",
                    "zh-hant": "嘗試將日語音韻，特別是音高重音資源整合成一個清單。"
                }
            },
            "https://github.com/llm-jp/awesome-japanese-llm": {
                "sub_category": null,
                "repository_name": "awesome-japanese-llm",
                "user_name": "llm-jp",
                "description": "オープンソースの日本語LLMまとめ",
                "multilingual_descriptions": {
                    "en": "Summary of Japanese LLM (Open Source)",
                    "ja": "オープンソースの日本語LLMまとめ",
                    "zh-hans": "开源的日语LLM总结",
                    "zh-hant": "開源的日本語LLM總結"
                }
            }
        }
    }
}