Entry Andrade:2012:SEC from talip.bib
Last update: Sun Oct 15 02:55:04 MDT 2017
Top |
Symbols |
Numbers |
Math |
A |
B |
C |
D |
E |
F |
G |
H |
I |
J |
K |
L |
M |
N |
O |
P |
Q |
R |
S |
T |
U |
V |
W |
X |
Y |
Z
BibTeX entry
@Article{Andrade:2012:SEC,
author = "Daniel Andrade and Takuya Matsuzaki and Jun'ichi
Tsujii",
title = "Statistical Extraction and Comparison of Pivot Words
for Bilingual Lexicon Extension",
journal = j-TALIP,
volume = "11",
number = "2",
pages = "6:1--6:??",
month = jun,
year = "2012",
DOI = "https://doi.org/10.1145/2184436.2184439",
ISSN = "1530-0226 (print), 1558-3430 (electronic)",
ISSN-L = "1530-0226",
bibdate = "Tue Jun 12 11:20:16 MDT 2012",
bibsource = "http://portal.acm.org/;
http://www.math.utah.edu/pub/tex/bib/talip.bib",
abstract = "Bilingual dictionaries can be automatically extended
by new translations using comparable corpora. The
general idea is based on the assumption that similar
words have similar contexts across languages. However,
previous studies have mainly focused on Indo-European
languages, or have used only a bag-of-words model to describe
the context. Furthermore, we argue that it is helpful
to extract only the statistically significant context,
instead of using all context. The present approach
addresses these issues in the following manner. First,
based on the context of a word with an unknown
translation (query word), we extract salient pivot
words. Pivot words are words for which a translation is
already available in a bilingual dictionary. For the
extraction of salient pivot words, we use a Bayesian
estimation of the point-wise mutual information to
measure statistical significance. In the second step,
we match these pivot words across languages to identify
translation candidates for the query word. We therefore
calculate a similarity score between the query word and
a translation candidate using the probability that the
same pivots will be extracted for both the query word
and the translation candidate. The proposed method uses
several context positions, namely, a bag-of-words of
one sentence, and the successors, predecessors, and
siblings with respect to the dependency parse tree of
the sentence. In order to make these context positions
comparable across Japanese and English, which are
unrelated languages, we use several heuristics to
adjust the dependency trees appropriately. We
demonstrate that the proposed method significantly
increases the accuracy of word translations, as
compared to previous methods.",
acknowledgement = ack-nhfb,
articleno = "6",
fjournal = "ACM Transactions on Asian Language Information
Processing (TALIP)",
journal-URL = "http://portal.acm.org/browse_dl.cfm?&idx=J820",
}
Related entries
- accuracy,
6(4)1,
7(1)1,
7(1)2,
8(3)11,
8(4)15,
9(1)4,
10(2)7,
10(4)17,
11(3)9,
12(1)4,
12(2)7,
12(3)10,
12(3)11,
12(3)12,
12(4)15,
13(3)12,
13(3)14
- across,
6(3)10,
8(2)7,
11(3)11
- address,
6(3)11,
7(1)2,
7(1)3,
8(2)6,
8(4)15,
8(4)18,
8(4)19,
9(1)3,
10(3)13,
10(4)21,
11(4)13,
11(4)17,
13(1)1,
13(2)8,
13(4)17
- all,
6(4)2,
7(1)1,
7(2)7,
7(3)8,
7(4)11,
7(4)12,
8(2)7,
8(4)16,
8(4)17,
9(2)5,
9(3)11,
9(3)12,
10(2)9,
10(3)15,
11(2)7,
11(4)18,
12(2)5,
12(3)9,
13(1)2,
13(2)6,
13(4)16
- already,
5(2)89,
8(4)14
- appropriately,
11(3)10
- argue,
8(4)19,
13(1)4,
13(2)10
- assumption,
10(2)9,
12(3)9
- automatically,
3(4)227,
5(2)89,
5(2)121,
5(2)165,
7(1)1,
7(2)6,
8(1)3,
8(2)7,
8(3)10,
9(2)6,
10(3)12,
11(4)16,
12(2)7,
12(4)15,
13(3)12,
13(4)16
- available,
5(2)89,
8(1)3,
8(4)17,
9(2)5,
10(2)8,
11(1)1,
11(2)7,
11(4)18,
12(4)14,
13(1)1
- based,
1(3)269,
2(4)301,
3(2)113,
4(3)357,
4(4)377,
5(2)121,
5(2)165,
5(3)185,
6(2)8,
6(3)9,
6(3)11,
6(4)3,
7(2)6,
7(3)10,
7(4)12,
8(1)4,
8(3)11,
8(3)12,
8(4)17,
8(4)19,
9(1)2,
9(2)5,
9(2)6,
9(2)7,
9(3)11,
10(1)4,
10(1)6,
10(2)7,
10(3)14,
10(3)16,
11(3)8,
11(3)11,
11(4)14,
11(4)15,
11(4)16,
11(4)17,
11(4)18,
12(1)1,
12(1)2,
12(1)4,
12(3)9,
12(3)10,
12(3)11,
13(1)2,
13(1)3,
13(1)4,
13(2)10,
13(3)13,
13(4)17,
13(4)18
- Bayesian,
11(3)9,
12(3)9
- bilingual,
4(2)78,
5(2)89,
5(2)121,
6(3)11,
7(1)1,
8(2)9,
10(3)16,
10(4)19,
12(3)9
- both,
6(2)6,
6(2)7,
6(3)10,
7(1)1,
7(1)2,
7(1)3,
7(3)8,
8(2)7,
8(3)11,
8(3)12,
9(1)2,
9(1)4,
9(2)5,
10(1)2,
10(1)4,
10(1)6,
10(2)10,
10(3)13,
10(3)15,
10(4)20,
10(4)21,
11(2)4,
11(2)7,
11(3)9,
11(4)18,
12(2)5,
12(2)7,
12(4)17,
13(2)9,
13(4)17
- calculate,
7(4)12,
11(2)5
- candidate,
5(2)121,
6(2)6,
7(2)5,
7(2)6,
10(1)3,
10(3)16,
10(4)21,
11(3)8,
12(3)9,
12(4)15,
13(1)2
- comparable,
6(3)11,
10(4)19,
12(3)9,
12(3)12,
13(4)17
- compared,
5(2)121,
6(3)9,
6(3)11,
8(4)16,
9(1)1,
9(3)11,
9(3)12,
10(4)17,
12(1)2,
12(4)17,
13(1)2,
13(1)4,
13(2)6,
13(3)12
- comparison,
1(2)145,
1(3)225,
2(3)193,
6(3)9,
8(1)2,
9(3)11,
9(3)12,
13(1)3
- context,
6(4)2,
8(4)15,
9(2)7,
9(4)14,
10(1)3,
10(4)18,
10(4)19,
11(2)7,
11(3)9,
12(1)2,
13(1)2
- corpora,
5(2)89,
5(2)121,
6(2)6,
6(3)11,
7(2)6,
9(2)5,
9(4)13,
10(3)15,
10(4)19,
10(4)21,
11(2)7,
11(3)11,
12(2)7,
13(1)1,
13(1)3,
13(2)9,
13(3)11
- demonstrate,
5(2)121,
6(4)1,
7(1)2,
7(2)7,
7(3)10,
8(2)7,
8(2)9,
9(1)4,
9(3)11,
11(3)8,
13(1)1,
13(1)3
- dependency,
6(3)9,
8(3)10,
9(2)7,
10(3)15,
11(4)18
- describe,
6(3)9,
6(4)3,
7(2)5,
7(2)6,
7(2)7,
7(3)9,
7(4)12,
8(4)14,
9(3)10,
9(3)11,
10(1)5,
12(1)3,
12(2)5,
13(1)1,
13(1)4,
13(2)9
- dictionary,
1(4)281,
5(2)121,
6(3)11,
7(3)9,
9(1)4,
10(1)3,
10(2)7,
11(4)16,
12(2)7,
13(3)14
- English,
2(3)245,
4(2)135,
5(2)89,
5(2)121,
5(3)245,
6(2)6,
6(2)7,
6(3)11,
6(4)2,
7(1)1,
7(4)11,
8(2)9,
8(4)15,
8(4)16,
8(4)17,
9(1)1,
9(1)3,
9(2)7,
9(3)12,
9(4)14,
9(4)15,
10(1)2,
10(1)4,
10(2)8,
10(3)14,
10(3)15,
10(4)17,
11(2)4,
11(2)5,
11(3)8,
11(3)11,
12(2)5,
12(3)12,
12(4)14,
12(4)17,
13(1)1,
13(4)16
- estimation,
8(2)6,
8(4)19,
11(1)3
- European, Indo-,
7(3)9,
9(3)11,
12(4)14,
13(2)7
- extended,
5(3)183,
7(3)10,
7(4)13,
8(4)15,
8(4)18,
9(1)3,
13(4)16
- extension,
7(4)13,
9(1)4,
11(3)9,
11(4)15
- extract,
6(3)11,
7(3)8,
7(3)10,
9(1)1,
9(2)6,
11(1)2,
11(2)4,
11(3)11,
11(4)15,
12(2)7,
12(3)9
- extracted,
3(4)227,
4(3)321,
6(2)8,
7(1)1,
7(1)3,
8(3)10,
9(1)1,
11(3)11,
13(2)9,
13(3)14,
13(4)16
- extraction,
1(1)34,
2(3)295,
5(1)61,
5(2)121,
6(2)6,
7(1)1,
8(4)16,
8(4)17,
10(3)14,
10(3)15,
11(1)2,
12(3)11,
13(1)3
- first,
5(2)165,
6(2)6,
6(4)3,
7(1)1,
7(3)8,
7(3)10,
8(2)7,
8(3)10,
8(3)11,
8(4)19,
9(3)10,
9(3)11,
10(3)13,
11(2)7,
11(3)8,
11(3)9,
11(3)11,
12(1)3,
12(1)4,
12(2)5,
12(3)10,
12(4)17,
13(2)7,
13(2)9,
13(3)13,
13(4)17
- focused,
5(2)121,
6(3)10,
11(4)13
- following,
7(2)7,
11(3)8,
12(3)10
- Furthermore,
6(2)7,
7(1)1,
7(4)11,
8(4)17,
9(2)6,
12(1)2,
12(2)7,
12(4)16,
13(1)1
- general,
8(4)14,
9(3)12,
10(3)12,
11(2)7,
11(3)10,
12(2)6,
12(4)14,
12(4)15
- have,
5(2)121,
6(3)10,
6(4)2,
7(2)7,
7(3)8,
7(4)11,
7(4)12,
7(4)13,
8(2)8,
8(2)9,
8(4)14,
8(4)16,
8(4)17,
8(4)18,
9(1)1,
9(1)3,
9(2)7,
9(4)15,
10(1)5,
10(2)7,
10(4)19,
10(4)20,
10(4)21,
11(1)2,
11(3)8,
12(1)3,
12(2)6,
13(1)3,
13(2)6,
13(2)7,
13(2)9,
13(3)11,
13(3)12
- helpful,
10(4)17,
10(4)18
- heuristic,
7(4)12
- however,
6(2)8,
7(2)7,
7(3)8,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(3)10,
9(1)1,
9(3)12,
10(3)12,
10(4)18,
11(2)7,
12(1)2,
12(2)7,
12(3)10,
12(3)11,
12(4)14,
13(3)11,
13(4)17
- idea,
8(3)12,
10(3)15,
11(3)8,
13(1)4
- identify,
5(2)146,
6(2)6,
8(3)11,
9(3)12,
10(1)5,
11(4)18,
12(3)10
- increase,
7(2)5,
7(3)9,
8(2)7,
8(4)15,
9(3)12,
9(4)15,
10(2)8,
11(4)18,
12(2)6,
12(3)11
- Indo-European,
7(3)9,
9(3)11,
12(4)14,
13(2)7
- information,
1(1)65,
1(1)83,
1(4)281,
2(3)245,
2(3)295,
3(1)1,
3(4)227,
4(2)57,
4(2)78,
4(3)243,
4(3)357,
4(4)375,
4(4)475,
5(1)44,
5(2)89,
5(3)264,
5(4)291,
5(4)296,
5(4)323,
6(2)7,
6(4)2,
7(1)2,
7(1)3,
7(2)5,
7(3)8,
7(4)12,
8(1)2,
8(1)3,
8(3)10,
8(3)11,
8(4)15,
8(4)16,
8(4)17,
9(1)1,
9(2)7,
9(3)9,
9(3)10,
9(3)11,
9(3)12,
9(4)13,
9(4)14,
9(4)15,
10(2)8,
10(2)10,
10(3)15,
10(3)16,
10(4)19,
10(4)20,
10(4)21,
11(1)2,
11(2)7,
11(4)15,
11(4)18,
12(2)5,
12(3)11,
12(4)16,
13(2)7,
13(3)13
- instead,
7(3)8,
9(2)5,
11(1)2
- issue,
3(1)1,
3(2)87,
3(4)213,
4(3)237,
4(4)375,
5(4)291,
6(2)7,
6(3)10,
7(1)2,
7(1)3,
7(2)4,
7(3)9,
7(4)11,
8(1)1,
8(2)5,
8(2)6,
8(3)12,
8(4)13,
9(3)9,
10(1)1,
10(3)11,
10(3)13,
10(4)18,
11(1)2,
11(4)12
- Japanese,
4(3)263,
4(3)280,
4(4)375,
5(2)146,
5(3)264,
6(3)11,
6(4)1,
7(2)6,
7(2)7,
7(3)8,
8(2)9,
9(1)4,
9(2)7,
11(3)8,
11(3)11,
11(4)14,
11(4)18,
12(1)3,
12(2)7,
12(3)10,
12(3)11,
12(4)16,
12(4)17
- lexicon,
8(2)9,
10(4)19,
11(2)4
- mainly,
7(2)7,
10(3)14,
12(1)2
- make,
6(4)2,
7(3)9,
8(2)9,
9(3)11,
11(4)15,
12(4)14,
12(4)15,
13(1)1,
13(1)3,
13(2)8
- manner,
8(3)12,
9(2)7,
12(3)9
- match,
7(4)11
- measure,
5(2)89,
6(2)6,
6(4)3,
8(2)7,
9(2)7,
10(1)2,
10(1)6,
10(4)20,
11(3)9,
11(3)11,
13(3)11,
13(3)13,
13(3)14
- namely,
7(4)12,
8(1)4,
10(2)9,
12(1)4,
12(4)16
- new,
5(1)74,
5(2)121,
6(2)8,
6(3)9,
7(2)7,
7(4)11,
8(2)6,
9(1)4,
9(2)7,
10(1)4,
10(3)15,
10(4)17,
10(4)20,
12(1)1,
12(1)3,
12(3)8,
12(3)9,
12(4)14,
13(1)1,
13(1)2,
13(2)6
- one,
5(2)89,
5(2)121,
6(2)6,
6(3)9,
6(4)3,
7(3)8,
7(3)9,
7(4)11,
7(4)13,
8(2)9,
8(4)16,
8(4)17,
9(1)1,
9(2)5,
9(2)7,
9(3)12,
9(4)14,
10(1)5,
10(3)12,
10(3)13,
10(4)19,
11(2)4,
11(2)7,
11(4)14,
12(1)1,
12(1)2,
12(2)5,
12(2)7,
12(3)11,
12(4)16,
13(1)4,
13(2)10,
13(4)17,
13(4)18
- only,
5(2)89,
5(2)165,
7(4)12,
7(4)13,
8(4)17,
9(2)5,
9(4)14,
12(1)3,
12(3)9,
12(3)11,
13(2)6,
13(4)18
- order,
7(4)13,
8(2)8,
8(3)10,
10(1)2,
10(4)17,
11(3)8,
11(4)18,
12(2)5,
12(2)6,
12(3)9,
12(3)11,
12(4)14,
12(4)17,
13(1)2,
13(3)11,
13(3)12
- parse,
7(4)13,
10(3)15
- pivot,
8(2)9,
12(4)14
- position,
8(2)8,
10(3)14,
13(1)2
- present,
5(2)89,
5(2)165,
6(2)7,
6(3)10,
6(4)2,
7(1)2,
7(1)3,
7(2)7,
7(3)9,
7(4)11,
7(4)13,
8(1)3,
8(2)6,
8(2)7,
8(2)8,
8(3)10,
8(4)14,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
9(1)1,
9(1)2,
9(1)3,
9(2)6,
9(4)14,
10(1)4,
10(1)6,
10(2)7,
10(3)14,
10(4)18,
10(4)19,
11(1)2,
11(1)3,
11(2)4,
11(2)5,
11(3)10,
11(4)13,
12(1)3,
12(2)5,
12(3)9,
12(3)11,
12(4)15,
13(2)8,
13(4)16
- previous,
5(2)89,
5(2)121,
7(2)7,
7(4)13,
9(2)5,
10(3)15,
10(4)18,
13(2)6,
13(3)12,
13(4)18
- probability,
5(2)121,
6(2)6,
8(4)19,
10(1)6,
10(3)16,
11(2)5,
12(3)9,
13(4)18
- proposed,
5(2)121,
5(2)165,
6(2)7,
7(1)1,
7(1)2,
7(3)9,
7(3)10,
7(4)11,
7(4)13,
8(1)4,
8(2)6,
8(3)10,
8(3)11,
8(4)14,
8(4)19,
9(1)1,
9(2)5,
9(2)7,
10(2)7,
10(2)9,
10(3)14,
10(4)18,
11(1)3,
11(2)5,
11(2)7,
11(3)8,
11(3)9,
11(3)10,
11(3)11,
11(4)16,
11(4)17,
12(1)4,
12(2)5,
12(2)7,
12(3)12,
12(4)16,
12(4)17,
13(2)6,
13(2)8,
13(3)13,
13(4)18
- query,
1(2)123,
1(2)159,
4(2)57,
5(3)245,
5(4)323,
5(4)360,
6(2)8,
6(4)2,
7(2)5,
9(1)1,
9(3)12,
11(3)11,
11(4)17,
13(2)6,
13(3)13
- respect,
7(3)9,
8(4)15,
9(1)3
- salient,
7(1)3,
7(3)9
- same,
7(4)11,
9(1)3,
9(2)6,
10(2)10,
12(4)16,
13(2)6
- score,
7(2)7,
7(4)12,
8(2)7,
8(3)10,
9(1)3,
9(2)6,
10(4)18,
12(3)9,
12(4)17,
13(1)2,
13(3)13,
13(4)16
- second,
5(2)89,
8(1)4,
8(2)7,
8(4)19,
11(1)3,
11(3)8,
11(3)9,
11(3)11,
12(1)3,
13(2)7,
13(4)17
- sentence,
1(3)173,
3(2)146,
4(3)321,
4(4)377,
5(2)121,
5(2)146,
5(2)165,
7(1)3,
7(2)6,
7(4)13,
8(1)3,
8(2)8,
9(1)2,
9(2)6,
10(4)21,
11(1)3,
11(2)5,
11(3)8,
11(3)10,
11(3)11,
12(1)2,
12(1)3,
12(2)7,
12(4)14,
12(4)17,
13(1)2,
13(3)11,
13(4)17
- several,
6(2)6,
6(2)7,
6(4)3,
7(2)5,
7(2)7,
7(3)10,
8(3)10,
8(4)16,
8(4)17,
8(4)18,
9(3)12,
11(4)13,
11(4)16,
12(1)2,
13(3)12,
13(3)14
- significance,
8(4)14,
13(3)11,
13(3)13
- significant,
5(2)121,
7(1)3,
8(1)4,
8(4)15,
8(4)16,
8(4)17,
8(4)18,
9(2)5,
9(3)11,
10(1)5,
10(2)8,
10(3)14,
11(2)7,
12(1)1,
12(4)16,
13(1)3,
13(3)14,
13(4)16
- significantly,
7(1)1,
7(4)13,
8(2)6,
8(4)15,
8(4)18,
9(1)2,
9(2)6,
9(3)12,
11(4)13,
11(4)17,
12(4)16,
13(2)6,
13(4)17
- similar,
5(2)146,
7(3)8,
7(4)11,
8(3)12,
9(3)11,
9(3)12,
10(1)2,
10(2)10,
11(3)11,
12(1)2,
12(4)17,
13(2)8
- similarity,
5(2)89,
5(2)165,
6(1)z-1,
6(2)6,
7(3)8,
8(2)6,
8(2)9,
9(1)1,
10(2)10,
11(2)5,
11(3)9,
11(3)11
- statistical,
1(1)3,
3(2)87,
3(4)243,
5(2)121,
5(4)323,
5(4)360,
6(1)z-4,
7(1)1,
8(1)2,
8(1)4,
8(2)6,
8(2)7,
8(2)8,
8(2)9,
8(3)10,
8(4)15,
8(4)19,
9(2)6,
9(2)7,
9(3)11,
10(4)18,
11(2)7,
11(3)8,
11(4)15,
12(1)1,
12(3)12,
12(4)14,
12(4)16,
12(4)17,
13(1)2,
13(1)3,
13(1)4,
13(4)17
- statistically,
7(4)13,
8(4)16,
9(3)11
- step,
7(3)8,
8(2)8,
8(4)16,
9(3)12,
10(1)5,
10(3)12,
12(1)2,
12(2)7,
13(3)14,
13(4)17
- study,
4(2)159,
4(3)243,
5(2)121,
5(2)146,
5(2)165,
5(3)209,
6(2)6,
6(2)7,
8(1)3,
8(1)4,
8(4)16,
9(2)5,
9(2)6,
9(2)7,
9(3)11,
10(2)10,
10(3)12,
10(4)17,
10(4)18,
11(1)3,
11(3)9,
11(3)11,
11(4)14,
13(1)3,
13(2)7,
13(3)11,
13(3)12,
13(3)14
- therefore,
7(1)2,
8(4)16,
8(4)17,
11(2)5,
11(3)8,
11(3)11,
11(4)13,
12(2)7,
12(4)16,
13(2)8
- tree,
7(4)13,
10(3)12,
10(3)15,
10(4)18
- Tsujii, Jun'ichi,
1(1)1,
8(2)9,
12(2)5
- unknown,
7(2)5,
10(3)16,
11(3)9,
12(4)16
- use,
4(2)159,
5(2)89,
5(2)146,
6(2)8,
6(3)11,
7(2)6,
7(3)9,
7(4)11,
7(4)12,
8(1)3,
8(2)9,
8(3)10,
8(3)11,
9(1)1,
9(1)3,
9(3)11,
10(1)3,
10(1)4,
11(1)1,
11(2)7,
11(3)8,
11(3)10,
11(4)14,
11(4)18,
12(1)1,
12(2)6,
12(3)9,
12(3)10,
13(2)6,
13(2)9,
13(2)10,
13(3)12
- which,
5(2)89,
5(2)121,
6(2)6,
6(2)8,
6(3)10,
6(4)1,
7(1)3,
7(2)7,
7(3)10,
7(4)13,
8(1)2,
8(1)4,
8(2)9,
8(3)10,
8(3)12,
8(4)14,
8(4)16,
8(4)18,
9(1)1,
9(2)5,
9(3)12,
9(4)14,
9(4)15,
10(1)4,
10(1)6,
10(2)7,
10(2)8,
10(2)9,
10(3)12,
10(3)13,
10(3)14,
10(3)15,
10(4)17,
10(4)19,
10(4)20,
11(3)8,
11(3)9,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)18,
12(1)1,
12(1)3,
12(1)4,
12(2)5,
12(2)6,
12(2)7,
12(3)10,
12(3)11,
12(4)15,
12(4)17,
13(1)1,
13(2)8,
13(3)13,
13(4)17,
13(4)18
- will,
5(2)146,
9(1)1,
11(1)1,
12(2)5,
12(2)6