File tree Expand file tree Collapse file tree 6 files changed +16
-11
lines changed Expand file tree Collapse file tree 6 files changed +16
-11
lines changed Original file line number Diff line number Diff line change 13
13
PMT1_DEP_ELECTRA_SMALL = HANLP_URL + 'dep/pmt_dep_electra_small_20220218_134518.zip'
14
14
'Electra small encoder (:cite:`clark2020electra`) with Biaffine decoder (:cite:`dozat:17a`) trained on PKU ' \
15
15
'Multi-view Chinese Treebank (PMT) 1.0 (:cite:`qiu-etal-2014-multi`). Performance is UAS=87.68% LAS=83.54%.'
16
+ CTB9_UDC_ELECTRA_SMALL = HANLP_URL + 'dep/udc_dep_electra_small_20220218_095452.zip'
17
+ 'Electra small encoder (:cite:`clark2020electra`) with Biaffine decoder (:cite:`dozat:17a`) trained on CTB9-UD420. ' \
18
+ 'Performance is UAS=85.92% LAS=81.13% .'
16
19
17
20
PTB_BIAFFINE_DEP_EN = HANLP_URL + 'dep/ptb_dep_biaffine_20200101_174624.zip'
18
21
'Biaffine LSTM model (:cite:`dozat:17a`) trained on PTB.'
Original file line number Diff line number Diff line change 16
16
CTB9_POS_RADICAL_ELECTRA_SMALL = HANLP_URL + 'pos/pos_ctb_radical_electra_small_20220215_111932.zip'
17
17
'Electra small model (:cite:`clark2020electra`) with radical embeddings (:cite:`he2018dual`) trained on CTB9 (:cite:`https://doi.org/10.35111/gvd0-xk91`). Accuracy = `96.14`.'
18
18
19
- C863_POS_ELECTRA_SMALL = HANLP_URL + 'pos/pos_863_electra_small_20210808_124848.zip'
20
- 'Electra small model (:cite:`clark2020electra`) trained on Chinese 863 corpus. Accuracy = `95.22`.'
19
+ C863_POS_ELECTRA_SMALL = HANLP_URL + 'pos/pos_863_electra_small_20220217_101958.zip'
20
+ 'Electra small model (:cite:`clark2020electra`) trained on Chinese 863 corpus. Accuracy = `95.19`.'
21
+ PKU_POS_ELECTRA_SMALL = HANLP_URL + 'pos/pos_pku_electra_small_20220217_142436.zip'
22
+ 'Electra small model (:cite:`clark2020electra`) trained on Chinese PKU corpus. Accuracy = `97.55`.'
21
23
22
24
PKU98_POS_ELECTRA_SMALL = HANLP_URL + 'pos/pos_pku_electra_small_20210808_125158.zip'
23
25
'Electra small model (:cite:`clark2020electra`) trained on CTB9 (:cite:`https://doi.org/10.35111/gvd0-xk91`). Accuracy = `97.60`.'
Original file line number Diff line number Diff line change 8
8
SEMEVAL16_TEXT_BIAFFINE_ZH = HANLP_URL + 'sdp/semeval16-text-biaffine_20200101_002257.zip'
9
9
'Biaffine SDP (:cite:`he-choi-2019`) trained on SemEval16 text data.'
10
10
11
- SEMEVAL16_ALL_ELECTRA_SMALL_ZH = HANLP_URL + 'sdp/semeval16_sdp_electra_small_20220208_122026.zip'
12
- 'Biaffine SDP (:cite:`he-choi-2019`) trained on SemEval16 text and news data.'
11
+ SEMEVAL16_ALL_ELECTRA_SMALL_ZH = HANLP_URL + 'sdp/semeval16_sdp_electra_small_20220218_140116.zip'
12
+ 'Biaffine SDP (:cite:`he-choi-2019`) trained on SemEval16 text and news data. UF=80.82% LF=70.02%. '
13
13
14
14
SEMEVAL15_PAS_BIAFFINE_EN = HANLP_URL + 'sdp/semeval15_biaffine_pas_20200103_152405.zip'
15
15
'Biaffine SDP (:cite:`he-choi-2019`) trained on SemEval15 PAS data.'
Original file line number Diff line number Diff line change 3
3
# Date: 2021-08-07 19:07
4
4
from hanlp_common.constant import HANLP_URL
5
5
6
- CPB3_SRL_ELECTRA_SMALL = HANLP_URL + 'srl/cpb3_electra_small_crf_20210807_190553.zip'
7
- 'Electra small model (:cite:`clark2020electra`) trained on CPB3. F1 = `76.53`.'
6
+ CPB3_SRL_ELECTRA_SMALL = HANLP_URL + 'srl/cpb3_electra_small_crf_has_transform_20220218_135910.zip'
7
+ 'Electra small model (:cite:`clark2020electra`) trained on CPB3. P=75.87% R=76.24% F1=76.05%.'
8
8
9
9
ALL = {}
Original file line number Diff line number Diff line change 15
15
'ALBERT model (:cite:`Lan2020ALBERT:`) trained on the largest CWS dataset in the world.'
16
16
SIGHAN2005_PKU_BERT_BASE_ZH = HANLP_URL + 'tok/sighan2005_pku_bert_base_zh_20201231_141130.zip'
17
17
'BERT model (:cite:`devlin-etal-2019-bert`) trained on sighan2005 pku dataset.'
18
- COARSE_ELECTRA_SMALL_ZH = HANLP_URL + 'tok/coarse_electra_small_zh_20210603_112321.zip'
19
- 'Electra (:cite:`clark2020electra`) small model trained on coarse-grained CWS corpora. Its performance is P=97.08% R=96.94% F1=97.01% which is ' \
18
+ COARSE_ELECTRA_SMALL_ZH = HANLP_URL + 'tok/coarse_electra_small_20220218_100557.zip'
19
+ 'Electra (:cite:`clark2020electra`) small model trained on coarse-grained CWS corpora. Its performance is P=96.97% R=96.87% F1=96.92% which is ' \
20
20
'much higher than that of MTL model '
21
- FINE_ELECTRA_SMALL_ZH = HANLP_URL + 'tok/fine_tok_electra_small_20220205_185926.zip'
22
- 'Electra (:cite:`clark2020electra`) small model trained on fine-grained CWS corpora. Its performance is P=97.72% R=97.67% F1=97.69% which is ' \
21
+ FINE_ELECTRA_SMALL_ZH = HANLP_URL + 'tok/fine_electra_small_20220217_190117.zip'
22
+ 'Electra (:cite:`clark2020electra`) small model trained on fine-grained CWS corpora. Its performance is P=97.44% R=97.40% F1=97.42% which is ' \
23
23
'much higher than that of MTL model '
24
24
CTB9_TOK_ELECTRA_SMALL = HANLP_URL + 'tok/ctb9_electra_small_20220215_205427.zip'
25
25
'Electra (:cite:`clark2020electra`) small model trained on CTB9. Its performance is P=97.15% R=97.36% F1=97.26% which is ' \
Original file line number Diff line number Diff line change 2
2
# Author: hankcs
3
3
# Date: 2019-12-28 19:26
4
4
5
- __version__ = '2.1.0-beta.15'
5
+ __version__ = '2.1.0-beta.16'
6
6
"""HanLP version"""
7
7
8
8
You can’t perform that action at this time.
0 commit comments