Entry Li:2011:MEC from talip.bib
Last update: Sun Oct 15 02:55:04 MDT 2017
Top |
Symbols |
Numbers |
Math |
A |
B |
C |
D |
E |
F |
G |
H |
I |
J |
K |
L |
M |
N |
O |
P |
Q |
R |
S |
T |
U |
V |
W |
X |
Y |
Z
BibTeX entry
@Article{Li:2011:MEC,
author = "Lishuang Li and Peng Wang and Degen Huang and Lian
Zhao",
title = "Mining {English--Chinese} Named Entity Pairs from
Comparable Corpora",
journal = j-TALIP,
volume = "10",
number = "4",
pages = "19:1--19:??",
month = dec,
year = "2011",
CODEN = "????",
DOI = "https://doi.org/10.1145/2025384.2025387",
ISSN = "1530-0226 (print), 1558-3430 (electronic)",
ISSN-L = "1530-0226",
bibdate = "Thu Dec 15 09:23:26 MST 2011",
bibsource = "http://portal.acm.org/;
http://www.math.utah.edu/pub/tex/bib/talip.bib",
abstract = "Bilingual Named Entity (NE) pairs are valuable
resources for many NLP applications. Since comparable
corpora are more accessible, abundant and up-to-date,
recent studies have concentrated on mining bilingual
lexicons using comparable corpora. Leveraging
comparable corpora, this research presents a novel
approach to mining English-Chinese NE translations by
combining multi-dimension features from various
information sources for every possible NE pair, which
include the transliteration model, English-Chinese
matching, Chinese-English matching, translation model,
length, and context vector. These features are
integrated into one model with linear combination and
the minimum sample risk (MSR) algorithm. Owing to the high
type-dependence of NE translation, we integrate
different features according to different NE types.",
acknowledgement = ack-nhfb,
articleno = "19",
fjournal = "ACM Transactions on Asian Language Information
Processing",
journal-URL = "http://portal.acm.org/browse_dl.cfm?&idx=J820",
}
Related entries
- according,
5(2)146,
5(2)165,
6(2)7,
7(2)7,
7(4)11,
8(1)3,
8(2)7,
9(2)6,
10(1)3,
12(4)17,
13(2)9
- algorithm,
1(4)281,
5(2)165,
6(3)11,
6(4)2,
6(4)3,
7(1)3,
7(2)7,
7(3)8,
7(3)10,
7(4)12,
8(1)4,
8(3)12,
9(1)3,
9(1)4,
10(2)7,
10(2)9,
10(2)10,
11(1)3,
11(2)4,
11(2)7,
11(3)9,
11(3)11,
11(4)14,
12(1)1,
12(1)2,
12(2)6,
13(1)4,
13(3)13,
13(4)18
- application,
1(2)103,
4(4)475,
6(2)7,
6(4)2,
7(1)2,
7(2)7,
7(3)8,
7(4)11,
7(4)13,
8(2)7,
8(2)9,
8(3)10,
8(4)14,
9(2)7,
9(4)13,
10(2)10,
11(4)17,
12(3)11
- bilingual,
4(2)78,
5(2)89,
5(2)121,
6(3)11,
7(1)1,
8(2)9,
10(3)16,
11(2)6,
12(3)9
- Chinese, English-,
6(2)6,
7(2)5
- Chinese-English,
10(4)18
- combination,
3(2)113,
4(3)340,
6(4)3,
8(1)4,
8(2)6,
8(4)16,
9(3)12,
10(3)12,
10(3)15,
11(4)17,
12(2)5,
12(2)7,
12(4)14,
13(2)9
- combining,
1(4)297,
6(3)11,
6(4)3,
7(4)13,
8(2)6,
8(3)11,
10(3)16,
11(4)15,
12(2)7
- comparable,
6(3)11,
11(2)6,
12(3)9,
12(3)12,
13(4)17
- context,
6(4)2,
8(4)15,
9(2)7,
9(4)14,
10(1)3,
10(4)18,
11(2)6,
11(2)7,
11(3)9,
12(1)2,
13(1)2
- corpora,
5(2)89,
5(2)121,
6(2)6,
6(3)11,
7(2)6,
9(2)5,
9(4)13,
10(3)15,
10(4)21,
11(2)6,
11(2)7,
11(3)11,
12(2)7,
13(1)1,
13(1)3,
13(2)9,
13(3)11
- different,
5(2)89,
6(3)9,
6(4)3,
7(2)7,
7(3)8,
7(4)13,
8(1)2,
8(2)7,
8(2)8,
8(3)11,
8(4)16,
8(4)17,
9(1)1,
9(1)4,
9(2)5,
9(2)6,
9(3)12,
10(1)4,
10(1)5,
10(3)12,
10(4)17,
11(3)8,
11(3)11,
11(4)16,
11(4)17,
11(4)18,
12(1)2,
12(3)11,
12(4)17,
13(2)6,
13(3)11,
13(4)16
- English, Chinese-,
1(2)103,
4(2)57,
8(2)7,
8(4)17,
10(4)17,
10(4)18,
13(1)2
- English--Chinese,
6(2)6,
7(2)5
- entity,
2(2)124,
2(3)290,
5(1)4,
5(2)121,
6(4)3,
7(1)1,
9(4)15,
10(2)9,
10(3)14,
10(3)15,
11(1)2,
11(3)11,
12(3)10
- every,
11(1)2
- feature,
2(3)290,
5(2)165,
6(4)1,
7(2)6,
7(2)7,
7(3)10,
7(4)13,
8(3)11,
8(4)14,
8(4)17,
9(1)2,
9(2)5,
9(2)6,
10(1)5,
10(1)6,
10(2)7,
10(3)13,
10(3)15,
10(4)17,
10(4)21,
11(3)10,
11(4)14,
11(4)16,
12(1)1,
12(1)4,
12(3)9,
12(3)10,
13(2)9,
13(3)13,
13(4)16
- have,
5(2)121,
6(3)10,
6(4)2,
7(2)7,
7(3)8,
7(4)11,
7(4)12,
7(4)13,
8(2)8,
8(2)9,
8(4)14,
8(4)16,
8(4)17,
8(4)18,
9(1)1,
9(1)3,
9(2)7,
9(4)15,
10(1)5,
10(2)7,
10(4)20,
10(4)21,
11(1)2,
11(2)6,
11(3)8,
12(1)3,
12(2)6,
13(1)3,
13(2)6,
13(2)7,
13(2)9,
13(3)11,
13(3)12
- high,
8(3)10,
10(1)2,
10(1)6,
10(2)7,
11(3)11,
12(1)4,
12(3)9,
12(3)10,
12(3)11,
13(1)1,
13(1)3,
13(3)12
- include,
7(3)8,
8(2)9,
9(4)15,
10(1)2,
11(2)7,
12(3)10,
13(2)7
- information,
1(1)65,
1(1)83,
1(4)281,
2(3)245,
2(3)295,
3(1)1,
3(4)227,
4(2)57,
4(2)78,
4(3)243,
4(3)357,
4(4)375,
4(4)475,
5(1)44,
5(2)89,
5(3)264,
5(4)291,
5(4)296,
5(4)323,
6(2)7,
6(4)2,
7(1)2,
7(1)3,
7(2)5,
7(3)8,
7(4)12,
8(1)2,
8(1)3,
8(3)10,
8(3)11,
8(4)15,
8(4)16,
8(4)17,
9(1)1,
9(2)7,
9(3)9,
9(3)10,
9(3)11,
9(3)12,
9(4)13,
9(4)14,
9(4)15,
10(2)8,
10(2)10,
10(3)15,
10(3)16,
10(4)20,
10(4)21,
11(1)2,
11(2)6,
11(2)7,
11(4)15,
11(4)18,
12(2)5,
12(3)11,
12(4)16,
13(2)7,
13(3)13
- integrate,
5(2)121,
10(3)15,
10(4)18,
11(1)3
- integrated,
8(2)9,
8(4)15,
11(2)7
- length,
7(1)3,
8(4)19,
9(3)12,
12(4)14
- Leveraging,
11(4)18
- lexicon,
8(2)9,
11(2)4,
11(2)6
- linear,
8(1)4,
12(1)3
- many,
5(2)89,
5(2)121,
7(2)7,
7(4)11,
7(4)12,
8(4)17,
9(1)1,
9(4)13,
10(1)2,
10(1)5,
10(4)17,
11(1)2,
12(1)2,
12(2)6,
12(3)9,
12(4)16,
13(4)17
- matching,
6(4)2,
8(2)6,
11(4)14,
11(4)16,
12(1)1
- minimum,
8(4)19,
12(1)2
- mining,
1(2)159,
5(1)1,
5(1)22,
5(1)74,
6(1)z,
7(2)6,
9(1)1,
9(4)15,
12(3)9,
12(3)11,
13(2)10
- more,
5(2)146,
6(2)7,
6(3)10,
7(3)9,
7(4)13,
8(1)4,
8(2)7,
8(3)12,
8(4)14,
8(4)16,
9(1)2,
9(2)6,
9(3)11,
9(3)12,
10(1)4,
11(2)4,
11(2)7,
12(1)1,
12(1)2,
12(3)9,
13(1)1,
13(1)3,
13(1)4,
13(2)8,
13(4)18
- named,
2(2)124,
2(3)290,
5(1)4,
5(2)121,
6(4)3,
7(1)1,
7(4)13,
9(4)15,
10(2)9,
10(3)15,
11(1)2,
12(3)10
- NE,
5(2)121,
7(1)1,
10(2)9,
11(1)2,
12(3)10
- NLP,
5(2)121,
6(4)3,
8(4)14,
9(4)15,
10(1)5,
11(4)15,
13(2)7
- novel,
4(3)243,
5(2)89,
5(2)165,
6(2)8,
6(4)2,
8(1)3,
8(3)12,
10(2)7,
10(3)14,
10(4)20,
11(1)3,
11(2)4,
11(3)11,
11(4)15,
11(4)17,
12(3)11,
12(3)12,
13(2)8,
13(3)13,
13(4)17
- one,
5(2)89,
5(2)121,
6(2)6,
6(3)9,
6(4)3,
7(3)8,
7(3)9,
7(4)11,
7(4)13,
8(2)9,
8(4)16,
8(4)17,
9(1)1,
9(2)5,
9(2)7,
9(3)12,
9(4)14,
10(1)5,
10(3)12,
10(3)13,
11(2)4,
11(2)6,
11(2)7,
11(4)14,
12(1)1,
12(1)2,
12(2)5,
12(2)7,
12(3)11,
12(4)16,
13(1)4,
13(2)10,
13(4)17,
13(4)18
- pair,
5(2)89,
5(2)121,
6(2)6,
6(3)11,
7(1)1,
7(3)8,
7(4)12,
8(1)3,
8(2)9,
8(4)17,
10(4)21,
11(3)11,
11(4)13,
11(4)18,
12(3)9,
12(4)14,
13(3)11
- possible,
7(2)6,
8(4)16,
8(4)18,
9(1)1,
9(1)3,
10(1)4,
10(3)15,
12(1)2
- present,
5(2)89,
5(2)165,
6(2)7,
6(3)10,
6(4)2,
7(1)2,
7(1)3,
7(2)7,
7(3)9,
7(4)11,
7(4)13,
8(1)3,
8(2)6,
8(2)7,
8(2)8,
8(3)10,
8(4)14,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
9(1)1,
9(1)2,
9(1)3,
9(2)6,
9(4)14,
10(1)4,
10(1)6,
10(2)7,
10(3)14,
10(4)18,
11(1)2,
11(1)3,
11(2)4,
11(2)5,
11(2)6,
11(3)10,
11(4)13,
12(1)3,
12(2)5,
12(3)9,
12(3)11,
12(4)15,
13(2)8,
13(4)16
- recent,
2(2)101,
4(4)375,
8(1)1,
8(3)12,
8(4)16,
11(4)15,
12(4)14
- research,
2(2)101,
5(2)89,
7(4)12,
8(1)2,
8(1)4,
8(4)18,
9(2)7,
9(3)12,
10(1)4,
10(3)14,
10(4)20,
10(4)21,
11(1)1,
11(1)2,
11(3)10,
12(1)3,
12(4)14,
13(1)1,
13(2)7,
13(2)10
- resource,
2(2)101,
2(2)124,
4(2)135,
5(2)89,
7(3)9,
7(4)11,
8(2)9,
8(3)12,
8(4)17,
9(2)5,
9(3)12,
9(4)14,
10(2)8,
10(3)12,
10(3)16,
11(4)14,
11(4)16,
11(4)18,
12(1)1,
12(4)14,
12(4)16,
13(1)1,
13(1)3,
13(2)7
- sample,
12(2)7,
13(2)6
- since,
5(2)89,
5(2)165,
8(2)9,
8(4)16,
8(4)18,
10(1)4,
10(1)5,
10(4)21,
11(2)7,
11(4)18,
12(1)2,
12(4)16,
13(4)17
- source,
5(2)121,
6(3)11,
8(2)6,
8(2)7,
8(2)8,
8(4)17,
9(1)1,
9(4)15,
10(3)12,
10(4)17,
11(4)18,
12(4)15,
13(1)1,
13(1)2,
13(3)12,
13(4)17
- transliteration,
5(2)121,
5(3)185,
6(1)z-1,
6(2)6,
9(1)1,
9(4)13,
9(4)14,
12(3)9
- type,
7(4)11,
8(4)17,
9(2)6,
9(3)11,
9(3)12,
11(1)2,
11(1)3,
11(4)18,
12(3)10,
12(3)11,
13(1)3,
13(2)6,
13(3)11
- valuable,
5(2)89,
6(2)8,
10(3)12
- various,
7(2)5,
8(1)3,
9(3)10,
9(3)11,
10(2)9,
10(3)13,
10(3)15,
11(2)5,
11(4)14,
12(2)6,
13(2)6,
13(2)10
- vector,
6(4)3,
7(2)7,
7(3)10,
11(2)5,
12(3)9
- which,
5(2)89,
5(2)121,
6(2)6,
6(2)8,
6(3)10,
6(4)1,
7(1)3,
7(2)7,
7(3)10,
7(4)13,
8(1)2,
8(1)4,
8(2)9,
8(3)10,
8(3)12,
8(4)14,
8(4)16,
8(4)18,
9(1)1,
9(2)5,
9(3)12,
9(4)14,
9(4)15,
10(1)4,
10(1)6,
10(2)7,
10(2)8,
10(2)9,
10(3)12,
10(3)13,
10(3)14,
10(3)15,
10(4)17,
10(4)20,
11(2)6,
11(3)8,
11(3)9,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)18,
12(1)1,
12(1)3,
12(1)4,
12(2)5,
12(2)6,
12(2)7,
12(3)10,
12(3)11,
12(4)15,
12(4)17,
13(1)1,
13(2)8,
13(3)13,
13(4)17,
13(4)18