From 8d163cb26ffa886c85d25c59ed6361def938eefc Mon Sep 17 00:00:00 2001 From: xxyzz Date: Thu, 24 Oct 2024 17:08:41 +0800 Subject: [PATCH] =?UTF-8?q?[ko]=20translate=20Korean=20tags=20and=20topics?= =?UTF-8?q?=20data=20in=20"=EB=AA=A8=EB=93=88:labels/data"?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Much of the data in these Lua files was copied from the English edition and has not been translated into Korean --- src/wiktextract/extractor/ko/tags.py | 29 ++++++++++++++++++++++++++++ 1 file changed, 29 insertions(+) diff --git a/src/wiktextract/extractor/ko/tags.py b/src/wiktextract/extractor/ko/tags.py index 52bf9a78..0489d36b 100644 --- a/src/wiktextract/extractor/ko/tags.py +++ b/src/wiktextract/extractor/ko/tags.py @@ -3,14 +3,43 @@ # https://ko.wiktionary.org/wiki/모듈:labels/data/topical # https://ko.wiktionary.org/wiki/모듈:labels/data GLOSS_TAGS = { + "인명": "name", "고어": "archaic", + "구식": "archaic", + # "대명동사": "", + # "말고름": "", + "비유": "metaphoric", + "사어": "obsolete", # dead language + "유아어": "baby-talk", "자동사": "intransitive", + "직역": "literally", + "타동사": "transitive", } TAGS = {**GLOSS_TAGS} TOPICS = { "금융": "finance", + "광고": "advertising", + "군사": "military", + "어류": "fish", + "물리": "physics", + "법률": "law", + "식물": "botany", + "역사": "history", + "의류": "clothing", + "의학": "medicine", + "전기": "electricity", + # "조류": "birds", + "지리": "geography", + "프로그래밍": "programming", + "컴퓨터": "computer", + "해부학": "anatomy", + "정치": "politics", + "종교": "religion", + "가톨릭": "Catholicism", + "축구": "football", + # "체육": "physical-education", }