|
94 | 94 | # spaCy model
|
95 | 95 | # Spacy 模型
|
96 | 96 | SPACY_MODEL_MAP = {
|
97 |
| - "en": "en_core_web_sm", |
98 |
| - "zh": "zh_core_web_sm", |
99 |
| - "es": "es_core_news_lg", |
100 |
| - "fr": "fr_core_news_lg", |
101 |
| - "de": "de_core_news_lg", |
102 |
| - "it": "it_core_news_lg", |
103 |
| - "ja": "ja_core_news_lg", |
104 |
| - "pt": "pt_core_news_lg", |
105 |
| - "nl": "nl_core_news_lg", |
106 |
| - "el": "el_core_news_lg", |
107 |
| - "ru": "ru_core_news_lg", |
108 |
| - "ar": "ar_core_news_lg", |
109 |
| - "hi": "hi_core_news_lg", |
110 |
| - "ko": "ko_core_news_lg", |
111 |
| - "pl": "pl_core_news_lg", |
112 |
| - "uk": "uk_core_news_lg", |
113 |
| - "vi": "vi_core_news_lg", |
114 |
| - "tr": "tr_core_news_lg", |
115 |
| - "th": "th_core_news_lg", |
116 |
| - "ro": "ro_core_news_lg", |
117 |
| - "da": "da_core_news_lg", |
118 |
| - "fi": "fi_core_news_lg", |
119 |
| - "hu": "hu_core_news_lg", |
120 |
| - "nb": "nb_core_news_lg", |
121 |
| - "sv": "sv_core_news_lg" |
| 97 | + "en": "en_core_web_md", |
| 98 | + "ru": "ru_core_news_md", |
| 99 | + "fr": "fr_core_news_md", |
| 100 | + |
| 101 | + # "es": "es_core_news_md", |
| 102 | + # "de": "de_core_news_md", |
| 103 | + # "it": "it_core_news_md", |
| 104 | + |
| 105 | + |
| 106 | + # Not supported |
| 107 | + # "zh": "zh_core_web_md", |
| 108 | + # "ja": "ja_core_news_md", |
122 | 109 | }
|
123 | 110 |
|
| 111 | + |
124 | 112 | # 使用空格分割的语言
|
125 | 113 | # Languages whose words are separated by spaces
|
126 | 114 | LANGUAGE_SPLIT_WITH_SPACE = ['en', 'es', 'fr', 'de', 'it', 'pt', 'nl', 'el', 'ru', 'ar', 'hi', 'pl', 'uk', 'vi', 'tr', 'ro', 'da', 'fi', 'hu', 'nb', 'sv']
|
|
0 commit comments