Entry Chen:2009:WTM from talip.bib
Last update: Sun Oct 15 02:55:04 MDT 2017
Top |
Symbols |
Numbers |
Math |
A |
B |
C |
D |
E |
F |
G |
H |
I |
J |
K |
L |
M |
N |
O |
P |
Q |
R |
S |
T |
U |
V |
W |
X |
Y |
Z
BibTeX entry
@Article{Chen:2009:WTM,
author = "Berlin Chen",
title = "Word Topic Models for Spoken Document Retrieval and
Transcription",
journal = j-TALIP,
volume = "8",
number = "1",
pages = "2:1--2:??",
month = mar,
year = "2009",
CODEN = "????",
DOI = "https://doi.org/10.1145/1482343.1482345",
ISSN = "1530-0226 (print), 1558-3430 (electronic)",
ISSN-L = "1530-0226",
bibdate = "Mon Mar 23 16:32:22 MDT 2009",
bibsource = "http://portal.acm.org/;
http://www.math.utah.edu/pub/tex/bib/talip.bib",
abstract = "Statistical language modeling (LM), which aims to
capture the regularities in human natural language and
quantify the acceptability of a given word sequence,
has long been an interesting yet challenging research
topic in the speech and language processing community.
It also has been introduced to information retrieval
(IR) problems, and provided an effective and
theoretically attractive probabilistic framework for
building IR systems. In this article, we propose a word
topic model (WTM) to explore the co-occurrence
relationship between words, as well as the long-span
latent topical information, for language modeling in
spoken document retrieval and transcription. The
document or the search history as a whole is modeled as
a composite WTM model for generating a newly observed
word. The underlying characteristics and different
kinds of model structures are extensively investigated,
while the performance of WTM is thoroughly analyzed and
verified by comparison with the well-known
probabilistic latent semantic analysis (PLSA) model as
well as the other models. The IR experiments are
performed on the TDT Chinese collections (TDT-2 and
TDT-3), while the large vocabulary continuous speech
recognition (LVCSR) experiments are conducted on the
Mandarin broadcast news collected in Taiwan.
Experimental results seem to indicate that WTM is a
promising alternative to the existing models.",
acknowledgement = ack-nhfb,
articleno = "2",
fjournal = "ACM Transactions on Asian Language Information
Processing",
journal-URL = "http://portal.acm.org/browse_dl.cfm?&idx=J820",
keywords = "adaptation; information retrieval; language model;
speech recognition; word topic model",
}
Related entries
- adaptation,
2(1)49,
3(2)94,
5(3)209,
9(2)5,
10(2)7,
11(2)7
- aim,
6(3)9,
8(2)8,
9(3)10,
10(2)10,
10(4)20,
11(4)17,
12(4)16
- analysis,
2(4)301,
3(2)94,
3(3)169,
4(3)263,
7(1)1,
7(1)3,
7(2)5,
7(3)9,
8(3)12,
8(4)19,
9(2)6,
9(2)7,
9(3)11,
9(4)15,
10(1)4,
10(3)16,
10(4)20,
11(2)4,
11(2)7,
11(4)16,
11(4)18,
12(2)6,
13(2)9,
13(3)11
- analyzed,
6(3)9,
10(1)2
- article,
3(4)227,
4(3)321,
5(2)121,
6(2)6,
6(2)7,
6(2)8,
6(4)3,
7(1)1,
7(1)3,
7(2)5,
7(2)6,
7(2)7,
7(3)8,
7(3)9,
7(4)11,
7(4)12,
7(4)13,
8(1)3,
8(1)4,
8(2)6,
8(2)8,
8(2)9,
8(3)10,
8(3)11,
8(3)12,
8(4)14,
8(4)16,
8(4)17,
8(4)18,
9(1)2,
9(1)4,
9(2)6,
9(3)10,
9(3)11,
9(3)12,
9(4)13,
9(4)14,
10(1)3,
10(1)5,
10(1)6,
10(2)7,
10(2)9,
10(2)10,
10(3)12,
10(3)13,
10(3)14,
10(3)15,
10(4)17,
10(4)18,
10(4)20,
10(4)21,
11(1)1,
11(2)4,
11(2)5,
11(2)7,
11(3)8,
11(3)10,
11(3)11,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)17,
11(4)18,
12(1)1,
12(1)3,
12(1)4,
12(2)5,
12(2)6,
12(2)7,
12(3)9,
12(3)10,
12(3)11,
12(3)12,
12(4)14,
13(1)1,
13(1)2,
13(1)3,
13(1)4,
13(2)6,
13(2)7,
13(2)8,
13(2)9,
13(3)12,
13(3)13,
13(4)16
- attractive,
5(2)89
- been,
5(2)121,
6(3)10,
6(4)3,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(2)9,
8(4)14,
8(4)17,
8(4)18,
9(1)1,
9(2)5,
9(4)15,
10(1)5,
10(4)17,
13(1)1,
13(2)6,
13(2)8,
13(2)9,
13(3)11,
13(3)12
- broadcast,
8(1)3,
8(4)18,
9(1)2
- building,
1(2)103,
8(2)9
- capture,
7(4)12,
7(4)13,
11(3)11
- challenging,
11(4)17,
12(1)2,
13(2)10
- characteristic,
7(1)2,
8(2)9,
11(1)3,
12(1)3
- Chen, Berlin,
3(2)128,
8(1)3
- co-occurrence,
7(4)12
- collected,
13(4)16
- collections,
7(2)5,
9(3)10,
9(3)11,
9(3)12,
13(3)13
- community.,
10(4)20,
13(1)1
- comparison,
1(2)145,
1(3)225,
2(3)193,
6(3)9,
9(3)11,
9(3)12,
11(2)6,
13(1)3
- composite,
7(4)13
- conducted,
6(2)8,
7(4)12,
9(2)7,
9(3)10,
9(3)12,
11(2)4,
11(2)7,
13(1)3,
13(4)18
- continuous,
1(1)83,
7(3)10
- different,
5(2)89,
6(3)9,
6(4)3,
7(2)7,
7(3)8,
7(4)13,
8(2)7,
8(2)8,
8(3)11,
8(4)16,
8(4)17,
9(1)1,
9(1)4,
9(2)5,
9(2)6,
9(3)12,
10(1)4,
10(1)5,
10(3)12,
10(4)17,
10(4)19,
11(3)8,
11(3)11,
11(4)16,
11(4)17,
11(4)18,
12(1)2,
12(3)11,
12(4)17,
13(2)6,
13(3)11,
13(4)16
- document,
1(3)225,
2(1)1,
3(2)128,
4(3)340,
5(2)121,
6(4)2,
7(1)3,
7(2)7,
7(3)8,
8(1)1,
8(1)3,
8(3)11,
8(3)12,
8(4)19,
9(3)12,
11(2)5,
12(1)3,
13(1)1,
13(2)6,
13(2)7,
13(2)9,
13(3)13,
13(4)17
- effective,
4(2)78,
6(2)7,
6(3)11,
7(4)12,
7(4)13,
8(3)10,
9(2)5,
9(3)12,
10(2)10,
10(3)14,
10(4)17,
10(4)18,
11(2)4,
11(2)7,
11(4)18,
12(2)7,
12(4)14,
13(3)13,
13(4)16
- existing,
6(2)8,
6(4)2,
8(2)7,
9(1)3,
9(2)5,
9(4)13,
10(3)16,
11(2)4,
11(2)7,
11(4)18,
12(2)5,
12(4)17,
13(1)2,
13(2)8
- experiment,
2(2)101,
2(2)143,
5(2)146,
5(2)165,
5(3)245,
6(2)7,
6(2)8,
7(1)1,
7(1)2,
7(1)3,
7(2)5,
7(4)11,
8(2)6,
8(3)11,
8(4)17,
9(2)6,
9(2)7,
9(3)11,
9(3)12,
10(4)20,
11(2)4,
11(2)5,
11(2)7,
11(3)10,
11(3)11,
11(4)15,
11(4)17,
12(1)2,
12(2)5,
12(2)7,
12(3)9,
12(3)11,
12(3)12,
12(4)16,
12(4)17,
13(1)2,
13(1)3,
13(2)6,
13(2)8,
13(3)13,
13(4)18
- experimental,
5(2)121,
6(2)6,
6(2)7,
7(2)5,
7(2)6,
7(2)7,
7(3)10,
7(4)13,
8(1)4,
8(2)9,
9(1)1,
9(1)2,
10(2)7,
11(3)9,
11(4)14,
12(3)10,
12(4)14,
13(2)7
- explore,
6(4)2,
10(3)13,
10(3)15,
11(4)18
- extensively,
5(2)121
- framework,
3(1)11,
5(2)146,
5(4)360,
8(1)4,
8(2)9,
8(3)12,
9(1)1,
9(1)2,
9(2)5,
9(3)10,
10(3)13,
10(3)14,
10(3)15,
11(2)5,
11(4)15,
12(1)3,
12(4)15,
12(4)17,
13(2)9,
13(4)18
- generating,
5(2)165,
7(3)8,
8(4)19,
9(2)6,
12(4)15
- given,
5(2)89,
5(2)165,
7(3)10,
7(4)13,
9(1)1,
9(2)7,
11(2)5,
11(3)8,
11(3)11,
11(4)13,
12(4)14,
13(1)2,
13(4)17
- has,
5(2)89,
5(2)121,
6(4)2,
6(4)3,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(3)10,
8(4)16,
8(4)17,
8(4)18,
9(1)1,
9(1)2,
9(1)3,
9(2)5,
9(4)15,
10(1)4,
10(1)5,
10(4)17,
11(1)2,
11(3)9,
12(1)1,
12(1)2,
12(4)15,
13(1)1,
13(2)6,
13(2)7,
13(2)8,
13(3)12,
13(4)18
- history,
9(2)7,
11(2)5,
11(4)13
- human,
7(3)8,
9(2)6,
10(1)2,
10(2)10,
12(1)1,
12(4)15,
13(2)10
- indicate,
7(1)3,
7(2)5,
8(3)10,
8(4)16,
10(2)7,
12(3)11,
13(3)12
- information,
1(1)65,
1(1)83,
1(4)281,
2(3)245,
2(3)295,
3(1)1,
3(4)227,
4(2)57,
4(2)78,
4(3)243,
4(3)357,
4(4)375,
4(4)475,
5(1)44,
5(2)89,
5(3)264,
5(4)291,
5(4)296,
5(4)323,
6(2)7,
6(4)2,
7(1)2,
7(1)3,
7(2)5,
7(3)8,
7(4)12,
8(1)3,
8(3)10,
8(3)11,
8(4)15,
8(4)16,
8(4)17,
9(1)1,
9(2)7,
9(3)9,
9(3)10,
9(3)11,
9(3)12,
9(4)13,
9(4)14,
9(4)15,
10(2)8,
10(2)10,
10(3)15,
10(3)16,
10(4)19,
10(4)20,
10(4)21,
11(1)2,
11(2)6,
11(2)7,
11(4)15,
11(4)18,
12(2)5,
12(3)11,
12(4)16,
13(2)7,
13(3)13
- interesting,
11(1)1,
12(1)3
- introduced,
7(1)3,
7(2)6,
8(1)4,
10(4)21
- investigated,
5(2)121,
5(2)146,
7(1)1,
9(1)2,
11(3)10
- IR,
4(3)340,
7(3)8,
9(3)10,
9(3)11,
9(3)12,
13(2)7
- kind,
7(4)13,
8(4)16,
10(3)13,
11(2)5,
11(2)7
- large,
6(2)8,
6(3)9,
6(3)11,
7(3)8,
7(3)9,
7(4)11,
8(3)12,
8(4)18,
9(4)14,
10(2)7,
10(4)20,
10(4)21,
11(1)2,
11(3)8,
12(2)6,
12(3)9,
13(1)3,
13(2)7,
13(2)8,
13(3)13,
13(4)17,
13(4)18
- latent,
3(2)94,
7(1)3,
8(3)12,
9(2)7,
10(4)17,
11(3)11,
12(2)5
- LM,
9(2)7,
9(3)11
- long,
8(1)4,
8(3)10
- Mandarin,
3(2)128,
5(2)89,
7(3)10,
8(1)3,
9(1)2
- modeled,
12(1)2,
12(3)9
- modeling,
1(1)3,
1(3)173,
3(2)87,
3(3)169,
6(1)z,
6(2)6,
6(3)9,
7(3)10,
7(4)13,
8(1)4,
9(4)14,
10(4)18,
10(4)21,
11(2)5,
12(2)5,
13(3)12,
13(4)16
- natural,
1(2)123,
3(1)11,
5(2)121,
5(4)291,
6(2)7,
7(1)1,
7(4)13,
8(2)9,
8(4)13,
8(4)14,
8(4)16,
8(4)19,
9(2)6,
9(3)11,
9(4)15,
10(3)14,
10(4)20,
11(1)2,
11(4)14,
11(4)15,
12(1)3,
13(3)14
- newly,
13(1)1
- news,
3(1)51,
3(4)227,
8(1)3,
8(4)18,
9(1)2,
9(4)15,
11(1)2,
12(3)10
- observed,
9(2)7,
11(2)4
- occurrence, co-,
7(4)12
- other,
5(2)165,
7(2)6,
7(2)7,
7(3)8,
7(4)11,
8(2)7,
8(4)14,
8(4)16,
8(4)17,
9(1)1,
10(2)7,
10(4)20,
11(2)4,
11(2)7,
11(4)18,
12(1)1,
12(1)3,
12(3)11,
12(4)16,
13(1)3,
13(1)4,
13(2)7
- performance,
5(2)121,
5(2)165,
6(2)8,
6(3)9,
6(4)1,
6(4)3,
7(1)1,
7(1)2,
7(2)5,
7(2)6,
7(2)7,
7(3)9,
7(3)10,
7(4)13,
8(1)3,
8(2)7,
8(2)8,
8(2)9,
8(3)10,
8(4)16,
8(4)17,
8(4)18,
9(1)2,
9(1)4,
9(2)5,
9(2)6,
9(3)11,
9(3)12,
9(4)14,
10(2)8,
10(3)13,
10(3)14,
11(2)7,
11(3)10,
11(3)11,
11(4)14,
11(4)15,
11(4)17,
12(1)2,
12(3)9,
12(3)11,
12(4)14,
12(4)15,
12(4)16,
13(1)3,
13(1)4,
13(2)7,
13(2)9,
13(4)16,
13(4)17
- performed,
7(3)10,
9(3)11,
10(1)2,
12(2)7,
13(2)6,
13(4)17
- probabilistic,
4(3)340,
8(1)3,
10(1)6,
11(1)3,
11(4)15,
13(4)18
- problem,
6(2)7,
6(3)9,
6(3)11,
6(4)1,
7(1)2,
7(2)7,
7(3)10,
8(2)9,
8(3)10,
8(4)19,
9(1)1,
9(1)3,
9(2)5,
9(4)13,
10(1)2,
10(1)4,
10(3)14,
10(3)16,
10(4)21,
11(3)8,
11(3)11,
11(4)17,
11(4)18,
12(1)2,
12(1)3,
12(2)7,
12(3)10,
12(3)12,
12(4)16,
13(2)8,
13(3)14,
13(4)17
- processing,
3(1)1,
3(4)213,
4(4)375,
5(2)121,
5(4)291,
6(2)7,
6(3)9,
6(3)10,
6(4)3,
7(1)1,
7(1)3,
7(2)7,
7(4)13,
8(2)9,
8(4)13,
8(4)14,
8(4)16,
8(4)18,
8(4)19,
9(2)5,
9(2)6,
9(3)11,
9(4)15,
10(3)11,
10(3)14,
10(4)20,
11(1)2,
11(3)9,
11(4)15,
12(1)3,
12(3)10,
13(1)1,
13(2)7
- promising,
5(2)165,
9(1)3,
12(1)3,
12(2)6
- propose,
5(2)89,
6(2)6,
6(2)8,
6(3)11,
7(3)8,
7(3)10,
7(4)12,
8(1)4,
8(2)9,
8(4)19,
9(2)7,
9(4)13,
10(2)10,
10(3)12,
10(3)15,
10(4)17,
10(4)20,
11(2)7,
11(3)9,
11(3)11,
11(4)15,
11(4)16,
11(4)18,
12(1)1,
12(1)2,
12(1)3,
12(1)4,
12(2)5,
12(2)6,
12(3)9,
12(3)10,
12(3)12,
12(4)16,
13(1)2,
13(1)3,
13(2)8,
13(2)9,
13(3)12,
13(3)13,
13(4)17,
13(4)18
- provided,
11(3)10,
11(4)13
- quantify,
8(4)17,
10(2)9
- recognition,
1(1)83,
1(4)297,
2(1)27,
2(3)290,
5(1)4,
5(2)165,
6(2)6,
6(3)9,
6(4)3,
7(1)2,
7(3)10,
8(3)11,
8(4)18,
9(1)2,
9(2)7,
10(1)6,
10(2)7,
10(2)9,
10(3)13,
11(1)1,
11(1)2,
11(4)13,
11(4)16,
11(4)17,
11(4)18,
12(1)4,
12(3)10,
13(3)12,
13(4)16
- relationship,
5(3)264,
7(1)3,
9(4)15
- research,
2(2)101,
5(2)89,
7(4)12,
8(1)4,
8(4)18,
9(2)7,
9(3)12,
10(1)4,
10(3)14,
10(4)19,
10(4)20,
10(4)21,
11(1)1,
11(1)2,
11(3)10,
12(1)3,
12(4)14,
13(1)1,
13(2)7,
13(2)10
- result,
4(2)135,
5(2)121,
5(2)146,
5(2)165,
6(2)6,
6(2)7,
6(3)9,
6(3)11,
6(4)3,
7(1)2,
7(2)5,
7(2)6,
7(2)7,
7(3)8,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(1)3,
8(1)4,
8(2)6,
8(2)9,
8(3)10,
8(3)12,
8(4)14,
8(4)15,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
9(1)1,
9(1)2,
9(2)5,
9(2)6,
9(2)7,
9(3)11,
9(3)12,
9(4)14,
10(1)2,
10(2)7,
11(2)4,
11(2)5,
11(3)8,
11(3)9,
11(3)11,
11(4)13,
11(4)14,
11(4)15,
12(1)3,
12(1)4,
12(2)5,
12(2)7,
12(3)9,
12(3)10,
12(3)11,
12(4)14,
12(4)16,
13(1)1,
13(1)4,
13(2)6,
13(2)7,
13(2)9,
13(3)11,
13(3)12,
13(3)14
- retrieval,
1(3)225,
1(4)281,
2(1)1,
2(2)164,
3(2)128,
4(1)1,
4(2)57,
4(2)78,
4(2)135,
4(2)186,
4(3)340,
4(3)357,
4(4)377,
4(4)475,
5(2)89,
5(3)264,
5(4)296,
5(4)323,
6(2)8,
6(4)2,
7(2)5,
7(3)8,
7(4)12,
8(1)1,
9(1)1,
9(3)9,
9(3)10,
9(3)11,
9(3)12,
9(4)13,
9(4)14,
10(2)8,
10(4)20,
11(1)2,
11(3)11,
13(2)6,
13(2)7,
13(3)13,
13(4)18
- search,
2(3)219,
4(2)159,
4(3)280,
6(2)8,
6(4)2,
7(3)8,
8(2)8,
8(3)12,
9(1)1,
9(3)11,
10(2)9,
10(3)16,
11(3)8,
11(3)11
- semantic,
3(1)66,
3(2)94,
5(2)165,
5(3)228,
7(1)2,
7(1)3,
7(4)13,
8(2)6,
8(3)12,
8(4)15,
9(2)7,
10(1)5,
10(3)13,
10(3)14,
10(3)15,
10(4)20,
10(4)21,
11(3)8,
11(3)11,
11(4)15,
11(4)18,
12(3)11,
12(4)16
- sequence,
5(2)165,
6(2)7,
6(3)10,
7(3)9,
8(1)3,
9(2)7,
9(3)12,
9(4)14,
10(1)4,
12(1)2,
12(1)3,
12(3)9,
12(3)10,
12(4)17,
13(1)2
- speech,
1(1)83,
4(1)38,
6(3)9,
7(1)2,
7(3)10,
8(1)4,
8(4)14,
8(4)18,
9(1)2,
9(2)7,
10(1)6,
10(2)7,
11(1)2,
11(3)10,
13(4)16
- spoken,
2(1)1,
3(2)128,
6(3)10,
7(1)2,
7(3)9,
8(1)1,
8(1)3,
8(1)4,
8(4)18,
9(3)11,
12(2)6,
13(2)7
- statistical,
1(1)3,
3(2)87,
3(4)243,
5(2)121,
5(4)323,
5(4)360,
6(1)z-4,
7(1)1,
8(1)4,
8(2)6,
8(2)7,
8(2)8,
8(2)9,
8(3)10,
8(4)15,
8(4)19,
9(2)6,
9(2)7,
9(3)11,
10(4)18,
11(2)6,
11(2)7,
11(3)8,
11(4)15,
12(1)1,
12(3)12,
12(4)14,
12(4)16,
12(4)17,
13(1)2,
13(1)3,
13(1)4,
13(4)17
- structure,
4(2)186,
5(2)89,
7(1)1,
7(3)8,
7(4)13,
8(1)4,
8(4)19,
10(3)12,
10(3)14,
11(3)8,
11(4)16,
12(1)3,
12(4)17
- TDT,
6(3)11
- topic,
2(2)85,
3(4)227,
5(4)388,
6(3)11,
8(3)12,
9(2)7,
9(3)12,
9(4)15,
11(2)4,
11(2)5
- transcription,
2(1)63,
8(1)4,
8(4)18,
13(4)16
- underlying,
8(3)12,
9(1)3,
10(2)9,
10(3)12
- verified,
7(2)6,
9(2)5
- vocabulary,
6(3)9,
9(3)12,
11(2)7,
12(4)14
- well,
5(2)121,
6(2)6,
6(3)11,
7(3)8,
7(3)9,
7(3)10,
8(4)18,
9(1)2,
9(3)12,
10(3)15,
11(1)2,
11(2)4,
11(3)11,
12(3)9,
13(1)2
- which,
5(2)89,
5(2)121,
6(2)6,
6(2)8,
6(3)10,
6(4)1,
7(1)3,
7(2)7,
7(3)10,
7(4)13,
8(1)4,
8(2)9,
8(3)10,
8(3)12,
8(4)14,
8(4)16,
8(4)18,
9(1)1,
9(2)5,
9(3)12,
9(4)14,
9(4)15,
10(1)4,
10(1)6,
10(2)7,
10(2)8,
10(2)9,
10(3)12,
10(3)13,
10(3)14,
10(3)15,
10(4)17,
10(4)19,
10(4)20,
11(2)6,
11(3)8,
11(3)9,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)18,
12(1)1,
12(1)3,
12(1)4,
12(2)5,
12(2)6,
12(2)7,
12(3)10,
12(3)11,
12(4)15,
12(4)17,
13(1)1,
13(2)8,
13(3)13,
13(4)17,
13(4)18
- while,
5(2)165,
8(4)18,
9(4)15,
10(1)4,
10(3)15,
11(2)4,
11(2)5,
12(3)10,
12(3)11,
13(1)1,
13(2)8,
13(3)12,
13(3)14
- whole,
8(3)12,
12(1)3
- yet,
9(3)11