Entry Kulick:2011:ESC from talip.bib
Last update: Sun Oct 15 02:55:04 MDT 2017
Top |
Symbols |
Numbers |
Math |
A |
B |
C |
D |
E |
F |
G |
H |
I |
J |
K |
L |
M |
N |
O |
P |
Q |
R |
S |
T |
U |
V |
W |
X |
Y |
Z
BibTeX entry
@Article{Kulick:2011:ESC,
author = "Seth Kulick",
title = "Exploiting Separation of Closed-Class Categories for
{Arabic} Tokenization and Part-of-Speech Tagging",
journal = j-TALIP,
volume = "10",
number = "1",
pages = "4:1--4:??",
month = mar,
year = "2011",
CODEN = "????",
DOI = "https://doi.org/10.1145/1929908.1929912",
ISSN = "1530-0226 (print), 1558-3430 (electronic)",
ISSN-L = "1530-0226",
bibdate = "Wed Mar 16 18:07:50 MDT 2011",
bibsource = "http://portal.acm.org/;
http://www.math.utah.edu/pub/tex/bib/talip.bib",
abstract = "Research on the problem of morphological
disambiguation of Arabic has noted that techniques
developed for lexical disambiguation in English do not
easily transfer over, since the affixation present in
Arabic creates a very different tag set than for
English, encoding both inflectional morphology and more
complex tokenization sequences. This work takes a new
approach to this problem based on a distinction between
the open-class and closed-class categories of tokens,
which differ both in their frequencies and in their
possible morphological affixations. This separation
simplifies the morphological analysis problem
considerably, making it possible to use a Conditional
Random Field model for joint tokenization and ``core''
part-of-speech tagging of the open-class items, while
the closed-class items are handled by regular
expressions.",
acknowledgement = ack-nhfb,
articleno = "4",
fjournal = "ACM Transactions on Asian Language Information
Processing",
journal-URL = "http://portal.acm.org/browse_dl.cfm?&idx=J820",
}
Related entries
- analysis,
2(4)301,
3(2)94,
3(3)169,
4(3)263,
7(1)1,
7(1)3,
7(2)5,
7(3)9,
8(1)2,
8(3)12,
8(4)19,
9(2)6,
9(2)7,
9(3)11,
9(4)15,
10(3)16,
10(4)20,
11(2)4,
11(2)7,
11(4)16,
11(4)18,
12(2)6,
13(2)9,
13(3)11
- Arabic,
8(4)13,
8(4)14,
8(4)15,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
10(1)1,
10(1)2,
10(1)3,
10(1)5,
11(1)2,
13(1)1,
13(1)4,
13(2)9
- based,
1(3)269,
2(4)301,
3(2)113,
4(3)357,
4(4)377,
5(2)121,
5(2)165,
5(3)185,
6(2)8,
6(3)9,
6(3)11,
6(4)3,
7(2)6,
7(3)10,
7(4)12,
8(1)4,
8(3)11,
8(3)12,
8(4)17,
8(4)19,
9(1)2,
9(2)5,
9(2)6,
9(2)7,
9(3)11,
10(1)6,
10(2)7,
10(3)14,
10(3)16,
11(2)6,
11(3)8,
11(3)11,
11(4)14,
11(4)15,
11(4)16,
11(4)17,
11(4)18,
12(1)1,
12(1)2,
12(1)4,
12(3)9,
12(3)10,
12(3)11,
13(1)2,
13(1)3,
13(1)4,
13(2)10,
13(3)13,
13(4)17,
13(4)18
- both,
6(2)6,
6(2)7,
6(3)10,
7(1)1,
7(1)2,
7(1)3,
7(3)8,
8(2)7,
8(3)11,
8(3)12,
9(1)2,
9(1)4,
9(2)5,
10(1)2,
10(1)6,
10(2)10,
10(3)13,
10(3)15,
10(4)20,
10(4)21,
11(2)4,
11(2)6,
11(2)7,
11(3)9,
11(4)18,
12(2)5,
12(2)7,
12(4)17,
13(2)9,
13(4)17
- category,
7(3)8,
11(3)9,
13(1)4
- complex,
5(2)146,
7(1)1,
10(2)8,
12(3)11,
13(1)4,
13(2)8
- conditional,
2(3)290,
6(4)3,
9(2)5,
10(1)6,
12(1)2
- core,
6(2)7,
8(4)15
- create,
7(2)6,
7(4)11,
9(3)10,
9(3)12
- developed,
7(2)7,
10(1)2,
10(3)12,
11(1)2,
13(4)16
- differ,
8(4)14,
9(2)5,
10(2)9
- different,
5(2)89,
6(3)9,
6(4)3,
7(2)7,
7(3)8,
7(4)13,
8(1)2,
8(2)7,
8(2)8,
8(3)11,
8(4)16,
8(4)17,
9(1)1,
9(1)4,
9(2)5,
9(2)6,
9(3)12,
10(1)5,
10(3)12,
10(4)17,
10(4)19,
11(3)8,
11(3)11,
11(4)16,
11(4)17,
11(4)18,
12(1)2,
12(3)11,
12(4)17,
13(2)6,
13(3)11,
13(4)16
- disambiguation,
2(1)49,
5(4)360,
7(2)5,
9(1)4,
12(2)7
- easily,
5(2)165,
11(3)8,
12(3)9,
13(3)13
- encoding,
6(3)10,
12(2)5
- English,
2(3)245,
4(2)135,
5(2)89,
5(2)121,
5(3)245,
6(2)6,
6(2)7,
6(3)11,
6(4)2,
7(1)1,
7(4)11,
8(2)9,
8(4)15,
8(4)16,
8(4)17,
9(1)1,
9(1)3,
9(2)7,
9(3)12,
9(4)14,
9(4)15,
10(1)2,
10(2)8,
10(3)14,
10(3)15,
10(4)17,
11(2)4,
11(2)5,
11(2)6,
11(3)8,
11(3)11,
12(2)5,
12(3)12,
12(4)14,
12(4)17,
13(1)1,
13(4)16
- exploiting,
6(2)7,
9(4)14,
11(4)16,
12(4)16
- expression,
2(4)324,
5(2)146,
5(2)165,
7(1)3,
7(2)6,
7(4)11,
8(1)4,
11(4)18,
12(3)11
- field,
2(3)290,
6(4)3,
8(4)14,
9(2)5,
9(2)7,
10(1)6,
11(4)13,
12(1)2,
12(4)15
- frequency,
10(1)2,
12(1)2,
12(2)6
- handled,
13(3)11
- has,
5(2)89,
5(2)121,
6(4)2,
6(4)3,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(1)2,
8(3)10,
8(4)16,
8(4)17,
8(4)18,
9(1)1,
9(1)2,
9(1)3,
9(2)5,
9(4)15,
10(1)5,
10(4)17,
11(1)2,
11(3)9,
12(1)1,
12(1)2,
12(4)15,
13(1)1,
13(2)6,
13(2)7,
13(2)8,
13(3)12,
13(4)18
- inflectional,
6(3)9,
7(3)9,
9(3)11,
10(2)8
- joint,
7(4)11
- lexical,
3(2)94,
5(1)4,
5(2)121,
8(2)8,
8(2)9,
8(4)15,
8(4)18,
8(4)19,
11(3)11,
11(4)14,
11(4)16,
11(4)18,
12(2)7,
12(3)12,
12(4)15,
13(1)2,
13(2)9
- making,
2(3)219,
7(1)1,
7(2)6
- more,
5(2)146,
6(2)7,
6(3)10,
7(3)9,
7(4)13,
8(1)4,
8(2)7,
8(3)12,
8(4)14,
8(4)16,
9(1)2,
9(2)6,
9(3)11,
9(3)12,
10(4)19,
11(2)4,
11(2)7,
12(1)1,
12(1)2,
12(3)9,
13(1)1,
13(1)3,
13(1)4,
13(2)8,
13(4)18
- morphological,
6(4)2,
7(3)9,
8(4)16,
9(1)3,
9(4)15,
11(3)9,
13(2)9,
13(3)14
- morphology,
7(3)9,
8(4)14,
8(4)16,
9(3)11
- new,
5(1)74,
5(2)121,
6(2)8,
6(3)9,
7(2)7,
7(4)11,
8(2)6,
9(1)4,
9(2)7,
10(3)15,
10(4)17,
10(4)20,
11(2)6,
12(1)1,
12(1)3,
12(3)8,
12(3)9,
12(4)14,
13(1)1,
13(1)2,
13(2)6
- not,
5(2)89,
5(2)121,
6(3)10,
7(2)7,
7(3)8,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(1)3,
8(2)7,
8(2)8,
8(2)9,
8(4)17,
9(2)6,
9(2)7,
9(4)14,
10(1)5,
10(2)8,
10(2)10,
10(4)18,
11(1)2,
11(3)10,
12(1)2,
12(1)3,
12(2)7,
12(3)9,
13(2)7,
13(2)9,
13(4)17,
13(4)18
- of-Speech, Part-,
11(3)9
- of-speech, part-,
1(2)145,
9(4)15,
10(1)5,
10(3)12,
11(3)9
- Part-of-Speech,
11(3)9
- part-of-speech,
1(2)145,
9(4)15,
10(1)5,
10(3)12,
11(3)9
- possible,
7(2)6,
8(4)16,
8(4)18,
9(1)1,
9(1)3,
10(3)15,
10(4)19,
12(1)2
- present,
5(2)89,
5(2)165,
6(2)7,
6(3)10,
6(4)2,
7(1)2,
7(1)3,
7(2)7,
7(3)9,
7(4)11,
7(4)13,
8(1)3,
8(2)6,
8(2)7,
8(2)8,
8(3)10,
8(4)14,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
9(1)1,
9(1)2,
9(1)3,
9(2)6,
9(4)14,
10(1)6,
10(2)7,
10(3)14,
10(4)18,
10(4)19,
11(1)2,
11(1)3,
11(2)4,
11(2)5,
11(2)6,
11(3)10,
11(4)13,
12(1)3,
12(2)5,
12(3)9,
12(3)11,
12(4)15,
13(2)8,
13(4)16
- problem,
6(2)7,
6(3)9,
6(3)11,
6(4)1,
7(1)2,
7(2)7,
7(3)10,
8(1)2,
8(2)9,
8(3)10,
8(4)19,
9(1)1,
9(1)3,
9(2)5,
9(4)13,
10(1)2,
10(3)14,
10(3)16,
10(4)21,
11(3)8,
11(3)11,
11(4)17,
11(4)18,
12(1)2,
12(1)3,
12(2)7,
12(3)10,
12(3)12,
12(4)16,
13(2)8,
13(3)14,
13(4)17
- random,
2(3)290,
6(4)3,
9(2)5,
10(1)6,
11(4)13,
12(1)2,
12(3)9
- research,
2(2)101,
5(2)89,
7(4)12,
8(1)2,
8(1)4,
8(4)18,
9(2)7,
9(3)12,
10(3)14,
10(4)19,
10(4)20,
10(4)21,
11(1)1,
11(1)2,
11(3)10,
12(1)3,
12(4)14,
13(1)1,
13(2)7,
13(2)10
- separation,
8(4)16
- sequence,
5(2)165,
6(2)7,
6(3)10,
7(3)9,
8(1)2,
8(1)3,
9(2)7,
9(3)12,
9(4)14,
12(1)2,
12(1)3,
12(3)9,
12(3)10,
12(4)17,
13(1)2
- set,
1(3)269,
5(2)121,
6(1)z,
7(1)3,
7(3)8,
7(4)11,
7(4)13,
8(3)10,
8(3)12,
8(4)15,
9(1)1,
9(1)3,
9(2)5,
10(2)8,
10(4)20,
11(2)5,
11(2)7,
11(3)10,
11(3)11,
11(4)13,
11(4)14,
12(1)2,
12(1)4,
12(3)9,
13(2)8,
13(2)9,
13(3)12,
13(3)13,
13(4)17
- since,
5(2)89,
5(2)165,
8(2)9,
8(4)16,
8(4)18,
10(1)5,
10(4)19,
10(4)21,
11(2)7,
11(4)18,
12(1)2,
12(4)16,
13(4)17
- Speech, Part-of-,
11(3)9
- speech, part-of-,
1(2)145,
9(4)15,
10(1)5,
10(3)12,
11(3)9
- tag,
9(2)5
- tagging,
1(2)145,
3(1)51,
9(2)5,
9(4)15,
11(2)7,
13(1)1
- take,
8(2)8,
10(4)20,
11(2)7
- technique,
2(1)63,
3(4)243,
5(2)89,
6(1)z,
6(2)7,
6(2)8,
6(3)9,
6(4)2,
6(4)3,
7(2)5,
7(2)7,
7(3)8,
7(4)12,
8(4)18,
9(1)3,
9(2)5,
10(2)9,
10(2)10,
10(4)21,
11(1)1,
12(2)6,
12(3)9,
12(3)11,
12(4)14,
13(2)8,
13(3)12,
13(3)13,
13(4)18
- than,
5(2)146,
6(3)10,
7(3)8,
7(4)11,
7(4)13,
8(2)8,
8(4)16,
9(1)2,
9(2)7,
9(3)11,
9(3)12,
10(1)3,
10(3)14,
11(2)4,
11(2)7,
11(3)8,
11(3)9,
11(4)13,
11(4)15,
12(2)7,
12(3)10,
12(4)16,
13(1)1,
13(4)17
- tokenization,
9(1)4
- use,
4(2)159,
5(2)89,
5(2)146,
6(2)8,
6(3)11,
7(2)6,
7(3)9,
7(4)11,
7(4)12,
8(1)3,
8(2)9,
8(3)10,
8(3)11,
9(1)1,
9(1)3,
9(3)11,
10(1)3,
11(1)1,
11(2)6,
11(2)7,
11(3)8,
11(3)10,
11(4)14,
11(4)18,
12(1)1,
12(2)6,
12(3)9,
12(3)10,
13(2)6,
13(2)9,
13(2)10,
13(3)12
- very,
5(2)89,
7(4)11,
8(3)12,
8(4)16,
8(4)18,
10(4)18,
12(3)12
- which,
5(2)89,
5(2)121,
6(2)6,
6(2)8,
6(3)10,
6(4)1,
7(1)3,
7(2)7,
7(3)10,
7(4)13,
8(1)2,
8(1)4,
8(2)9,
8(3)10,
8(3)12,
8(4)14,
8(4)16,
8(4)18,
9(1)1,
9(2)5,
9(3)12,
9(4)14,
9(4)15,
10(1)6,
10(2)7,
10(2)8,
10(2)9,
10(3)12,
10(3)13,
10(3)14,
10(3)15,
10(4)17,
10(4)19,
10(4)20,
11(2)6,
11(3)8,
11(3)9,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)18,
12(1)1,
12(1)3,
12(1)4,
12(2)5,
12(2)6,
12(2)7,
12(3)10,
12(3)11,
12(4)15,
12(4)17,
13(1)1,
13(2)8,
13(3)13,
13(4)17,
13(4)18
- while,
5(2)165,
8(1)2,
8(4)18,
9(4)15,
10(3)15,
11(2)4,
11(2)5,
12(3)10,
12(3)11,
13(1)1,
13(2)8,
13(3)12,
13(3)14
- work,
5(2)121,
6(2)6,
6(3)11,
6(4)2,
7(2)7,
7(3)9,
8(4)19,
9(2)5,
9(4)15,
10(2)10,
12(1)3,
12(3)9,
13(1)1,
13(2)9,
13(3)14,
13(4)18