Entry Hsu:2010:MST from talip.bib
Last update: Sun Oct 15 02:55:04 MDT 2017
Top |
Symbols |
Numbers |
Math |
A |
B |
C |
D |
E |
F |
G |
H |
I |
J |
K |
L |
M |
N |
O |
P |
Q |
R |
S |
T |
U |
V |
W |
X |
Y |
Z
BibTeX entry
@Article{Hsu:2010:MST,
author = "Chung-Chian Hsu and Chien-Hsing Chen",
title = "Mining Synonymous Transliterations from the {World
Wide Web}",
journal = j-TALIP,
volume = "9",
number = "1",
pages = "1:1--1:??",
month = mar,
year = "2010",
CODEN = "????",
DOI = "https://doi.org/10.1145/1731035.1731036",
ISSN = "1530-0226 (print), 1558-3430 (electronic)",
ISSN-L = "1530-0226",
bibdate = "Mon Mar 29 15:34:01 MDT 2010",
bibsource = "http://portal.acm.org/;
http://www.math.utah.edu/pub/tex/bib/talip.bib",
abstract = "The World Wide Web has been considered one of the
important sources for information. Using search engines
to retrieve Web pages can gather lots of information,
including foreign information. However, to be better
understood by local readers, proper names in a foreign
language, such as English, are often transliterated to
a local language such as Chinese. Due to different
translators and the lack of translation standard,
translating foreign proper nouns may result in
different transliterations and pose a notorious
headache. In particular, it may cause incomplete search
results. Using one transliteration as a query keyword
will fail to retrieve the Web pages which use a
different word as the transliteration. Consequently,
important information may be missed. We present a
framework for mining synonymous transliterations as
many as possible from the Web for a given
transliteration. The results can be used to construct a
database of synonymous transliterations which can be
utilized for query expansion so as to alleviate the
incomplete search problem. Experimental results show
that the proposed framework can effectively retrieve
the set of snippets which may contain synonymous
transliterations and then extract the target terms.
Most of the extracted synonymous transliterations have
higher rank of similarity to the input transliteration
compared to other noise terms.",
acknowledgement = ack-nhfb,
articleno = "1",
fjournal = "ACM Transactions on Asian Language Information
Processing",
journal-URL = "http://portal.acm.org/browse_dl.cfm?&idx=J820",
keywords = "Chinese transliteration; cross-lingual information
retrieval; synonymous transliteration; text mining; Web
mining",
}
Related entries
- alleviate,
6(3)9,
7(3)10,
8(2)9
- been,
5(2)121,
6(3)10,
6(4)3,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(1)2,
8(2)9,
8(4)14,
8(4)17,
8(4)18,
9(2)5,
9(4)15,
10(1)5,
10(4)17,
13(1)1,
13(2)6,
13(2)8,
13(2)9,
13(3)11,
13(3)12
- better,
6(2)8,
7(2)7,
7(4)13,
8(1)4,
8(3)11,
8(4)16,
9(2)7,
9(3)11,
9(3)12,
11(3)8,
11(4)13,
11(4)15,
12(2)7
- Chen, Chien-Hsing,
6(1)z-1
- compared,
5(2)121,
6(3)9,
6(3)11,
8(4)16,
9(3)11,
9(3)12,
10(4)17,
11(2)6,
12(1)2,
12(4)17,
13(1)2,
13(1)4,
13(2)6,
13(3)12
- consequently,
6(4)1,
8(4)16,
11(4)13
- considered,
5(2)165,
8(4)15,
9(2)5,
11(2)4,
12(1)4,
13(1)2
- construct,
9(2)6,
10(2)7,
10(2)9,
12(3)11
- contain,
7(4)11,
8(3)11,
9(2)7,
10(4)21,
11(3)10,
12(4)16
- cross-lingual,
2(2)164,
2(3)181,
2(3)245,
3(2)94,
4(2)57,
4(2)135,
13(1)3
- database,
6(2)6,
6(2)8
- different,
5(2)89,
6(3)9,
6(4)3,
7(2)7,
7(3)8,
7(4)13,
8(1)2,
8(2)7,
8(2)8,
8(3)11,
8(4)16,
8(4)17,
9(1)4,
9(2)5,
9(2)6,
9(3)12,
10(1)4,
10(1)5,
10(3)12,
10(4)17,
10(4)19,
11(3)8,
11(3)11,
11(4)16,
11(4)17,
11(4)18,
12(1)2,
12(3)11,
12(4)17,
13(2)6,
13(3)11,
13(4)16
- due,
5(2)121,
6(2)8,
7(2)7,
9(1)2,
9(4)15,
10(2)10,
10(3)12,
10(4)21,
11(2)7,
12(4)14,
13(1)4,
13(4)17
- effectively,
6(2)7,
6(2)8,
7(2)7,
7(4)12,
8(3)12,
11(3)10,
12(1)2
- engine,
4(3)305,
7(3)8,
9(3)11,
11(3)11,
12(4)14
- English,
2(3)245,
4(2)135,
5(2)89,
5(2)121,
5(3)245,
6(2)6,
6(2)7,
6(3)11,
6(4)2,
7(1)1,
7(4)11,
8(2)9,
8(4)15,
8(4)16,
8(4)17,
9(1)3,
9(2)7,
9(3)12,
9(4)14,
9(4)15,
10(1)2,
10(1)4,
10(2)8,
10(3)14,
10(3)15,
10(4)17,
11(2)4,
11(2)5,
11(2)6,
11(3)8,
11(3)11,
12(2)5,
12(3)12,
12(4)14,
12(4)17,
13(1)1,
13(4)16
- expansion,
4(2)57,
8(1)4,
9(3)12,
12(2)7,
13(3)13
- experimental,
5(2)121,
6(2)6,
6(2)7,
7(2)5,
7(2)6,
7(2)7,
7(3)10,
7(4)13,
8(1)2,
8(1)4,
8(2)9,
9(1)2,
10(2)7,
11(3)9,
11(4)14,
12(3)10,
12(4)14,
13(2)7
- extract,
6(3)11,
7(3)8,
7(3)10,
9(2)6,
11(1)2,
11(2)4,
11(2)6,
11(3)11,
11(4)15,
12(2)7,
12(3)9
- extracted,
3(4)227,
4(3)321,
6(2)8,
7(1)1,
7(1)3,
8(3)10,
11(2)6,
11(3)11,
13(2)9,
13(3)14,
13(4)16
- fail,
11(2)7,
11(3)8,
13(2)8
- framework,
3(1)11,
5(2)146,
5(4)360,
8(1)2,
8(1)4,
8(2)9,
8(3)12,
9(1)2,
9(2)5,
9(3)10,
10(3)13,
10(3)14,
10(3)15,
11(2)5,
11(4)15,
12(1)3,
12(4)15,
12(4)17,
13(2)9,
13(4)18
- given,
5(2)89,
5(2)165,
7(3)10,
7(4)13,
8(1)2,
9(2)7,
11(2)5,
11(3)8,
11(3)11,
11(4)13,
12(4)14,
13(1)2,
13(4)17
- has,
5(2)89,
5(2)121,
6(4)2,
6(4)3,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(1)2,
8(3)10,
8(4)16,
8(4)17,
8(4)18,
9(1)2,
9(1)3,
9(2)5,
9(4)15,
10(1)4,
10(1)5,
10(4)17,
11(1)2,
11(3)9,
12(1)1,
12(1)2,
12(4)15,
13(1)1,
13(2)6,
13(2)7,
13(2)8,
13(3)12,
13(4)18
- have,
5(2)121,
6(3)10,
6(4)2,
7(2)7,
7(3)8,
7(4)11,
7(4)12,
7(4)13,
8(2)8,
8(2)9,
8(4)14,
8(4)16,
8(4)17,
8(4)18,
9(1)3,
9(2)7,
9(4)15,
10(1)5,
10(2)7,
10(4)19,
10(4)20,
10(4)21,
11(1)2,
11(2)6,
11(3)8,
12(1)3,
12(2)6,
13(1)3,
13(2)6,
13(2)7,
13(2)9,
13(3)11,
13(3)12
- higher,
7(4)13,
12(2)7,
13(1)2
- however,
6(2)8,
7(2)7,
7(3)8,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(3)10,
9(3)12,
10(3)12,
10(4)18,
11(2)6,
11(2)7,
12(1)2,
12(2)7,
12(3)10,
12(3)11,
12(4)14,
13(3)11,
13(4)17
- Hsu, Chung-Chian,
6(1)z-1
- important,
5(4)413,
7(1)3,
7(3)10,
9(2)7,
9(4)13,
10(2)10,
11(4)18,
12(1)3,
13(3)12,
13(4)18
- including,
5(2)121,
6(2)7,
7(1)3,
7(2)7,
8(1)3,
8(2)6,
9(2)7,
9(3)11,
10(3)12,
11(4)18,
13(4)16
- information,
1(1)65,
1(1)83,
1(4)281,
2(3)245,
2(3)295,
3(1)1,
3(4)227,
4(2)57,
4(2)78,
4(3)243,
4(3)357,
4(4)375,
4(4)475,
5(1)44,
5(2)89,
5(3)264,
5(4)291,
5(4)296,
5(4)323,
6(2)7,
6(4)2,
7(1)2,
7(1)3,
7(2)5,
7(3)8,
7(4)12,
8(1)2,
8(1)3,
8(3)10,
8(3)11,
8(4)15,
8(4)16,
8(4)17,
9(2)7,
9(3)9,
9(3)10,
9(3)11,
9(3)12,
9(4)13,
9(4)14,
9(4)15,
10(2)8,
10(2)10,
10(3)15,
10(3)16,
10(4)19,
10(4)20,
10(4)21,
11(1)2,
11(2)6,
11(2)7,
11(4)15,
11(4)18,
12(2)5,
12(3)11,
12(4)16,
13(2)7,
13(3)13
- input,
5(2)165,
8(2)7,
9(1)3,
9(2)6,
10(1)6,
10(4)20,
12(1)2,
12(1)4,
12(2)6,
13(1)4,
13(2)8,
13(3)12,
13(4)17
- lack,
7(3)9,
8(4)14,
12(2)6,
12(2)7
- lingual, cross-,
2(3)181,
3(2)94,
4(2)57,
4(2)135,
13(1)3
- local,
7(4)12,
8(1)4,
8(4)15,
13(4)17
- many,
5(2)89,
5(2)121,
7(2)7,
7(4)11,
7(4)12,
8(4)17,
9(4)13,
10(1)2,
10(1)5,
10(4)17,
10(4)19,
11(1)2,
12(1)2,
12(2)6,
12(3)9,
12(4)16,
13(4)17
- may,
8(3)11,
8(4)16,
9(4)13,
12(1)4,
12(3)10,
13(4)17
- mining,
1(2)159,
5(1)1,
5(1)22,
5(1)74,
6(1)z,
7(2)6,
9(4)15,
10(4)19,
12(3)9,
12(3)11,
13(2)10
- most,
6(2)6,
7(1)1,
7(3)8,
7(3)10,
8(4)15,
9(2)5,
9(3)11,
10(1)5,
10(2)8,
12(1)1,
12(1)2,
13(1)1,
13(1)4,
13(2)6,
13(3)14,
13(4)18
- name,
2(3)169,
5(2)121,
7(1)1,
7(4)11,
9(1)2,
9(4)13,
11(1)2
- noise,
6(1)z-1,
10(4)21,
13(1)3
- noun,
3(1)33,
7(4)13,
9(2)7,
12(3)10
- often,
7(3)8,
10(3)14,
11(3)8,
12(1)2
- one,
5(2)89,
5(2)121,
6(2)6,
6(3)9,
6(4)3,
7(3)8,
7(3)9,
7(4)11,
7(4)13,
8(2)9,
8(4)16,
8(4)17,
9(2)5,
9(2)7,
9(3)12,
9(4)14,
10(1)5,
10(3)12,
10(3)13,
10(4)19,
11(2)4,
11(2)6,
11(2)7,
11(4)14,
12(1)1,
12(1)2,
12(2)5,
12(2)7,
12(3)11,
12(4)16,
13(1)4,
13(2)10,
13(4)17,
13(4)18
- other,
5(2)165,
7(2)6,
7(2)7,
7(3)8,
7(4)11,
8(1)2,
8(2)7,
8(4)14,
8(4)16,
8(4)17,
10(2)7,
10(4)20,
11(2)4,
11(2)7,
11(4)18,
12(1)1,
12(1)3,
12(3)11,
12(4)16,
13(1)3,
13(1)4,
13(2)7
- page,
7(3)8,
8(3)11,
8(3)12
- particular,
5(2)89,
8(4)18,
9(2)5,
9(4)15,
10(2)9,
10(4)18,
11(2)5
- pose,
7(1)3,
8(4)14
- possible,
7(2)6,
8(4)16,
8(4)18,
9(1)3,
10(1)4,
10(3)15,
10(4)19,
12(1)2
- present,
5(2)89,
5(2)165,
6(2)7,
6(3)10,
6(4)2,
7(1)2,
7(1)3,
7(2)7,
7(3)9,
7(4)11,
7(4)13,
8(1)3,
8(2)6,
8(2)7,
8(2)8,
8(3)10,
8(4)14,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
9(1)2,
9(1)3,
9(2)6,
9(4)14,
10(1)4,
10(1)6,
10(2)7,
10(3)14,
10(4)18,
10(4)19,
11(1)2,
11(1)3,
11(2)4,
11(2)5,
11(2)6,
11(3)10,
11(4)13,
12(1)3,
12(2)5,
12(3)9,
12(3)11,
12(4)15,
13(2)8,
13(4)16
- problem,
6(2)7,
6(3)9,
6(3)11,
6(4)1,
7(1)2,
7(2)7,
7(3)10,
8(1)2,
8(2)9,
8(3)10,
8(4)19,
9(1)3,
9(2)5,
9(4)13,
10(1)2,
10(1)4,
10(3)14,
10(3)16,
10(4)21,
11(3)8,
11(3)11,
11(4)17,
11(4)18,
12(1)2,
12(1)3,
12(2)7,
12(3)10,
12(3)12,
12(4)16,
13(2)8,
13(3)14,
13(4)17
- proposed,
5(2)121,
5(2)165,
6(2)7,
7(1)1,
7(1)2,
7(3)9,
7(3)10,
7(4)11,
7(4)13,
8(1)4,
8(2)6,
8(3)10,
8(3)11,
8(4)14,
8(4)19,
9(2)5,
9(2)7,
10(2)7,
10(2)9,
10(3)14,
10(4)18,
11(1)3,
11(2)5,
11(2)6,
11(2)7,
11(3)8,
11(3)9,
11(3)10,
11(3)11,
11(4)16,
11(4)17,
12(1)4,
12(2)5,
12(2)7,
12(3)12,
12(4)16,
12(4)17,
13(2)6,
13(2)8,
13(3)13,
13(4)18
- query,
1(2)123,
1(2)159,
4(2)57,
5(3)245,
5(4)323,
5(4)360,
6(2)8,
6(4)2,
7(2)5,
9(3)12,
11(2)6,
11(3)11,
11(4)17,
13(2)6,
13(3)13
- rank,
7(2)6,
10(1)3,
11(3)11
- result,
4(2)135,
5(2)121,
5(2)146,
5(2)165,
6(2)6,
6(2)7,
6(3)9,
6(3)11,
6(4)3,
7(1)2,
7(2)5,
7(2)6,
7(2)7,
7(3)8,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(1)2,
8(1)3,
8(1)4,
8(2)6,
8(2)9,
8(3)10,
8(3)12,
8(4)14,
8(4)15,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
9(1)2,
9(2)5,
9(2)6,
9(2)7,
9(3)11,
9(3)12,
9(4)14,
10(1)2,
10(2)7,
11(2)4,
11(2)5,
11(3)8,
11(3)9,
11(3)11,
11(4)13,
11(4)14,
11(4)15,
12(1)3,
12(1)4,
12(2)5,
12(2)7,
12(3)9,
12(3)10,
12(3)11,
12(4)14,
12(4)16,
13(1)1,
13(1)4,
13(2)6,
13(2)7,
13(2)9,
13(3)11,
13(3)12,
13(3)14
- retrieval,
1(3)225,
1(4)281,
2(1)1,
2(2)164,
3(2)128,
4(1)1,
4(2)57,
4(2)78,
4(2)135,
4(2)186,
4(3)340,
4(3)357,
4(4)377,
4(4)475,
5(2)89,
5(3)264,
5(4)296,
5(4)323,
6(2)8,
6(4)2,
7(2)5,
7(3)8,
7(4)12,
8(1)1,
8(1)2,
9(3)9,
9(3)10,
9(3)11,
9(3)12,
9(4)13,
9(4)14,
10(2)8,
10(4)20,
11(1)2,
11(3)11,
13(2)6,
13(2)7,
13(3)13,
13(4)18
- retrieve,
6(2)8,
11(3)11
- search,
2(3)219,
4(2)159,
4(3)280,
6(2)8,
6(4)2,
7(3)8,
8(1)2,
8(2)8,
8(3)12,
9(3)11,
10(2)9,
10(3)16,
11(3)8,
11(3)11
- set,
1(3)269,
5(2)121,
6(1)z,
7(1)3,
7(3)8,
7(4)11,
7(4)13,
8(3)10,
8(3)12,
8(4)15,
9(1)3,
9(2)5,
10(1)4,
10(2)8,
10(4)20,
11(2)5,
11(2)7,
11(3)10,
11(3)11,
11(4)13,
11(4)14,
12(1)2,
12(1)4,
12(3)9,
13(2)8,
13(2)9,
13(3)12,
13(3)13,
13(4)17
- show,
5(2)89,
5(2)146,
7(1)1,
7(1)2,
7(1)3,
7(4)11,
7(4)12,
7(4)13,
8(1)4,
8(2)7,
8(2)9,
8(3)12,
8(4)16,
8(4)17,
9(1)2,
9(1)3,
9(2)5,
9(2)6,
9(2)7,
9(3)11,
9(3)12,
9(4)14,
10(1)3,
10(3)15,
11(2)4,
11(2)5,
11(2)7,
11(3)8,
11(3)11,
11(4)14,
11(4)15,
11(4)17,
11(4)18,
12(1)2,
12(1)4,
12(2)5,
12(2)7,
12(3)9,
12(3)10,
12(3)11,
12(4)15,
12(4)16,
13(1)3,
13(2)6,
13(2)7,
13(2)9,
13(3)14
- similarity,
5(2)89,
5(2)165,
6(1)z-1,
6(2)6,
7(3)8,
8(2)6,
8(2)9,
10(2)10,
11(2)5,
11(2)6,
11(3)9,
11(3)11
- snippets,
8(3)12
- source,
5(2)121,
6(3)11,
8(2)6,
8(2)7,
8(2)8,
8(4)17,
9(4)15,
10(3)12,
10(4)17,
10(4)19,
11(4)18,
12(4)15,
13(1)1,
13(1)2,
13(3)12,
13(4)17
- standard,
6(3)10,
7(4)11,
8(4)14,
8(4)15,
8(4)18,
9(2)5,
9(2)6,
10(3)12,
11(2)5,
11(4)18,
13(2)7,
13(3)13,
13(4)17
- such,
7(2)7,
7(3)8,
7(3)10,
7(4)12,
8(2)8,
8(3)10,
8(3)11,
8(3)12,
8(4)14,
8(4)16,
8(4)17,
9(3)12,
9(4)13,
9(4)15,
10(1)5,
10(2)8,
10(3)12,
10(4)21,
11(1)2,
11(2)5,
11(2)7,
11(3)8,
11(3)10,
11(3)11,
11(4)13,
11(4)16,
11(4)17,
11(4)18,
12(1)1,
12(1)2,
12(2)6,
12(3)10,
12(3)11,
12(4)14,
12(4)17,
13(1)1,
13(3)12,
13(4)17
- target,
5(2)121,
6(4)1,
7(4)13,
8(1)3,
8(2)7,
8(2)8,
8(3)12,
8(4)17,
10(3)12,
10(4)17,
11(4)17,
12(2)7,
12(3)11,
12(3)12
- term,
1(1)34,
4(3)357,
5(1)22,
7(2)5,
7(2)7,
7(4)12,
8(2)9,
9(3)12,
10(4)17,
11(2)4,
11(3)9,
12(2)5,
12(4)15,
13(3)13
- text,
1(1)34,
1(2)159,
3(3)190,
3(4)215,
4(1)38,
4(2)135,
4(4)435,
5(1)1,
5(2)165,
6(1)z-3,
6(3)10,
6(4)2,
7(2)6,
7(3)8,
7(3)9,
8(1)4,
8(3)11,
8(4)14,
8(4)16,
8(4)18,
9(3)10,
9(4)15,
10(3)14,
11(1)2,
11(2)4,
11(2)5,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)17,
11(4)18,
12(1)2,
12(1)3,
12(2)6,
12(3)11,
12(4)15,
13(1)1,
13(1)4,
13(2)7,
13(2)8,
13(2)9,
13(2)10,
13(3)14
- then,
5(2)121,
6(2)6,
7(1)1,
7(3)10,
7(4)12,
8(1)4,
8(2)7,
8(3)10,
8(3)11,
8(3)12,
8(4)14,
9(2)7,
9(3)11,
10(2)7,
10(3)13,
10(4)20,
11(1)3,
11(2)7,
11(3)11,
11(4)15,
12(1)3,
12(3)10,
12(4)17,
13(1)4,
13(2)9,
13(3)13,
13(4)16
- translating,
5(2)121,
8(1)4,
8(2)9
- translators,
12(4)15
- transliterated,
13(2)6
- transliteration,
5(2)121,
5(3)185,
6(1)z-1,
6(2)6,
9(4)13,
9(4)14,
10(4)19,
12(3)9
- use,
4(2)159,
5(2)89,
5(2)146,
6(2)8,
6(3)11,
7(2)6,
7(3)9,
7(4)11,
7(4)12,
8(1)3,
8(2)9,
8(3)10,
8(3)11,
9(1)3,
9(3)11,
10(1)3,
10(1)4,
11(1)1,
11(2)6,
11(2)7,
11(3)8,
11(3)10,
11(4)14,
11(4)18,
12(1)1,
12(2)6,
12(3)9,
12(3)10,
13(2)6,
13(2)9,
13(2)10,
13(3)12
- used,
5(2)89,
5(2)146,
7(1)3,
7(2)6,
7(2)7,
7(3)9,
7(4)12,
7(4)13,
8(3)10,
8(4)17,
9(1)3,
9(2)6,
9(3)10,
10(1)2,
10(1)6,
10(2)7,
10(2)8,
10(3)12,
10(3)13,
10(4)20,
11(1)2,
11(1)3,
11(3)10,
11(4)13,
11(4)14,
12(2)5,
12(3)9,
12(3)11,
12(3)12,
13(2)6,
13(3)11
- utilized,
10(4)18,
11(4)14,
11(4)16
- Web,
1(2)159,
3(1)66,
6(2)6,
7(3)8,
7(4)11,
8(3)12,
9(4)15,
10(4)21,
11(2)4,
11(3)11,
11(4)16
- which,
5(2)89,
5(2)121,
6(2)6,
6(2)8,
6(3)10,
6(4)1,
7(1)3,
7(2)7,
7(3)10,
7(4)13,
8(1)2,
8(1)4,
8(2)9,
8(3)10,
8(3)12,
8(4)14,
8(4)16,
8(4)18,
9(2)5,
9(3)12,
9(4)14,
9(4)15,
10(1)4,
10(1)6,
10(2)7,
10(2)8,
10(2)9,
10(3)12,
10(3)13,
10(3)14,
10(3)15,
10(4)17,
10(4)19,
10(4)20,
11(2)6,
11(3)8,
11(3)9,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)18,
12(1)1,
12(1)3,
12(1)4,
12(2)5,
12(2)6,
12(2)7,
12(3)10,
12(3)11,
12(4)15,
12(4)17,
13(1)1,
13(2)8,
13(3)13,
13(4)17,
13(4)18
- wide,
7(4)13
- will,
5(2)146,
11(1)1,
11(2)6,
12(2)5,
12(2)6
- world,
5(2)89,
6(3)10,
8(2)9,
9(3)11,
9(4)13,
11(4)18,
12(2)6,
13(4)18