Entry Farghaly:2009:ANL from talip.bib
Last update: Sun Oct 15 02:55:04 MDT 2017
Top |
Symbols |
Numbers |
Math |
A |
B |
C |
D |
E |
F |
G |
H |
I |
J |
K |
L |
M |
N |
O |
P |
Q |
R |
S |
T |
U |
V |
W |
X |
Y |
Z
BibTeX entry
@Article{Farghaly:2009:ANL,
author = "Ali Farghaly and Khaled Shaalan",
title = "{Arabic} Natural Language Processing: Challenges and
Solutions",
journal = j-TALIP,
volume = "8",
number = "4",
pages = "14:1--14:??",
month = dec,
year = "2009",
CODEN = "????",
DOI = "https://doi.org/10.1145/1644879.1644881",
ISSN = "1530-0226 (print), 1558-3430 (electronic)",
ISSN-L = "1530-0226",
bibdate = "Mon Mar 29 15:37:17 MDT 2010",
bibsource = "http://portal.acm.org/;
http://www.math.utah.edu/pub/tex/bib/talip.bib",
abstract = "The Arabic language presents researchers and
developers of natural language processing (NLP)
applications for Arabic text and speech with serious
challenges. The purpose of this article is to describe
some of these challenges and to present some solutions
that would guide current and future practitioners in
the field of Arabic natural language processing (ANLP).
We begin with general features of the Arabic language
in Sections 1, 2, and 3 and then we move to more
specific properties of the language in the rest of the
article. In Section 1 of this article we highlight the
significance of the Arabic language today and describe
its general properties. Section 2 presents the feature
of Arabic Diglossia, showing how the sociolinguistic
aspects of the Arabic language differ from those of other
languages. The stability of Arabic Diglossia and its
implications for ANLP applications are discussed and
ways to deal with this problematic property are
proposed. Section 3 deals with the properties of the
Arabic script and the explosion of ambiguity that
results from the absence of short vowel representations
and overt case markers in contemporary Arabic texts. We
present in Section 4 specific features of the Arabic
language such as the nonconcatenative property of
Arabic morphology, Arabic as an agglutinative language,
Arabic as a pro-drop language, and the challenge these
properties pose to ANLP. We also present solutions that
have already been adopted by some pioneering
researchers in the field. In Section 5 we point out
the lack of formal and explicit grammars of Modern
Standard Arabic, which impedes the progress of more
advanced ANLP systems. In Section 6 we draw our
conclusion.",
acknowledgement = ack-nhfb,
articleno = "14",
fjournal = "ACM Transactions on Asian Language Information
Processing",
journal-URL = "http://portal.acm.org/browse_dl.cfm?&idx=J820",
keywords = "Arabic dialects; Arabic script; Modern Standard
Arabic",
}
Related entries
- adopted,
5(2)165,
9(3)10,
10(2)7,
12(1)2
- already,
5(2)89,
11(2)6
- ambiguity,
7(2)5,
8(4)15
- application,
1(2)103,
4(4)475,
6(2)7,
6(4)2,
7(1)2,
7(2)7,
7(3)8,
7(4)11,
7(4)13,
8(2)7,
8(2)9,
8(3)10,
9(2)7,
9(4)13,
10(2)10,
10(4)19,
11(4)17,
12(3)11
- Arabic,
8(4)13,
8(4)15,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
10(1)1,
10(1)2,
10(1)3,
10(1)4,
10(1)5,
11(1)2,
13(1)1,
13(1)4,
13(2)9
- article,
3(4)227,
4(3)321,
5(2)121,
6(2)6,
6(2)7,
6(2)8,
6(4)3,
7(1)1,
7(1)3,
7(2)5,
7(2)6,
7(2)7,
7(3)8,
7(3)9,
7(4)11,
7(4)12,
7(4)13,
8(1)2,
8(1)3,
8(1)4,
8(2)6,
8(2)8,
8(2)9,
8(3)10,
8(3)11,
8(3)12,
8(4)16,
8(4)17,
8(4)18,
9(1)2,
9(1)4,
9(2)6,
9(3)10,
9(3)11,
9(3)12,
9(4)13,
9(4)14,
10(1)3,
10(1)5,
10(1)6,
10(2)7,
10(2)9,
10(2)10,
10(3)12,
10(3)13,
10(3)14,
10(3)15,
10(4)17,
10(4)18,
10(4)20,
10(4)21,
11(1)1,
11(2)4,
11(2)5,
11(2)7,
11(3)8,
11(3)10,
11(3)11,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)17,
11(4)18,
12(1)1,
12(1)3,
12(1)4,
12(2)5,
12(2)6,
12(2)7,
12(3)9,
12(3)10,
12(3)11,
12(3)12,
12(4)14,
13(1)1,
13(1)2,
13(1)3,
13(1)4,
13(2)6,
13(2)7,
13(2)8,
13(2)9,
13(3)12,
13(3)13,
13(4)16
- aspect,
4(1)1,
7(2)7
- been,
5(2)121,
6(3)10,
6(4)3,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(1)2,
8(2)9,
8(4)17,
8(4)18,
9(1)1,
9(2)5,
9(4)15,
10(1)5,
10(4)17,
13(1)1,
13(2)6,
13(2)8,
13(2)9,
13(3)11,
13(3)12
- begin,
9(4)15
- case,
8(2)8,
9(2)5,
9(3)12,
10(3)12,
10(4)18,
12(1)1,
12(1)2,
13(2)8
- challenge,
4(3)243,
6(3)10,
6(4)3,
8(1)4,
8(4)18,
9(1)3,
10(3)12,
13(1)1,
13(1)4,
13(2)8,
13(3)12,
13(4)17
- conclusion,
13(3)11
- current,
9(1)3,
9(2)5,
10(1)6,
13(1)2
- deal,
7(1)3,
13(3)11
- describe,
6(3)9,
6(4)3,
7(2)5,
7(2)6,
7(2)7,
7(3)9,
7(4)12,
9(3)10,
9(3)11,
10(1)5,
11(2)6,
12(1)3,
12(2)5,
13(1)1,
13(1)4,
13(2)9
- differ,
9(2)5,
10(1)4,
10(2)9
- discussed,
6(2)7,
9(2)5
- explicit,
12(2)5,
13(3)12
- feature,
2(3)290,
5(2)165,
6(4)1,
7(2)6,
7(2)7,
7(3)10,
7(4)13,
8(3)11,
8(4)17,
9(1)2,
9(2)5,
9(2)6,
10(1)5,
10(1)6,
10(2)7,
10(3)13,
10(3)15,
10(4)17,
10(4)19,
10(4)21,
11(3)10,
11(4)14,
11(4)16,
12(1)1,
12(1)4,
12(3)9,
12(3)10,
13(2)9,
13(3)13,
13(4)16
- field,
2(3)290,
6(4)3,
9(2)5,
9(2)7,
10(1)4,
10(1)6,
11(4)13,
12(1)2,
12(4)15
- future,
11(2)7,
11(3)10
- general,
9(3)12,
10(3)12,
11(2)6,
11(2)7,
11(3)10,
12(2)6,
12(4)14,
12(4)15
- grammar,
1(2)123,
3(2)113,
7(1)1,
10(3)12,
10(4)18,
11(3)8,
11(3)9,
12(4)15,
13(3)11
- guide,
13(2)9
- have,
5(2)121,
6(3)10,
6(4)2,
7(2)7,
7(3)8,
7(4)11,
7(4)12,
7(4)13,
8(2)8,
8(2)9,
8(4)16,
8(4)17,
8(4)18,
9(1)1,
9(1)3,
9(2)7,
9(4)15,
10(1)5,
10(2)7,
10(4)19,
10(4)20,
10(4)21,
11(1)2,
11(2)6,
11(3)8,
12(1)3,
12(2)6,
13(1)3,
13(2)6,
13(2)7,
13(2)9,
13(3)11,
13(3)12
- how,
5(2)146,
6(4)3,
7(1)2,
7(3)9,
7(4)12,
8(4)16,
9(2)5,
9(3)12,
11(3)8,
12(4)14,
13(2)9,
13(2)10
- lack,
7(3)9,
9(1)1,
12(2)6,
12(2)7
- marker,
4(4)435,
8(2)8
- Modern,
8(4)18
- more,
5(2)146,
6(2)7,
6(3)10,
7(3)9,
7(4)13,
8(1)4,
8(2)7,
8(3)12,
8(4)16,
9(1)2,
9(2)6,
9(3)11,
9(3)12,
10(1)4,
10(4)19,
11(2)4,
11(2)7,
12(1)1,
12(1)2,
12(3)9,
13(1)1,
13(1)3,
13(1)4,
13(2)8,
13(4)18
- morphology,
7(3)9,
8(4)16,
9(3)11,
10(1)4
- natural,
1(2)123,
3(1)11,
5(2)121,
5(4)291,
6(2)7,
7(1)1,
7(4)13,
8(1)2,
8(2)9,
8(4)13,
8(4)16,
8(4)19,
9(2)6,
9(3)11,
9(4)15,
10(3)14,
10(4)20,
11(1)2,
11(4)14,
11(4)15,
12(1)3,
13(3)14
- NLP,
5(2)121,
6(4)3,
9(4)15,
10(1)5,
10(4)19,
11(4)15,
13(2)7
- other,
5(2)165,
7(2)6,
7(2)7,
7(3)8,
7(4)11,
8(1)2,
8(2)7,
8(4)16,
8(4)17,
9(1)1,
10(2)7,
10(4)20,
11(2)4,
11(2)7,
11(4)18,
12(1)1,
12(1)3,
12(3)11,
12(4)16,
13(1)3,
13(1)4,
13(2)7
- pioneering,
7(3)9
- point,
6(2)8,
10(1)6,
12(3)9,
12(4)16,
13(2)6,
13(4)17
- pose,
7(1)3,
9(1)1
- present,
5(2)89,
5(2)165,
6(2)7,
6(3)10,
6(4)2,
7(1)2,
7(1)3,
7(2)7,
7(3)9,
7(4)11,
7(4)13,
8(1)3,
8(2)6,
8(2)7,
8(2)8,
8(3)10,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
9(1)1,
9(1)2,
9(1)3,
9(2)6,
9(4)14,
10(1)4,
10(1)6,
10(2)7,
10(3)14,
10(4)18,
10(4)19,
11(1)2,
11(1)3,
11(2)4,
11(2)5,
11(2)6,
11(3)10,
11(4)13,
12(1)3,
12(2)5,
12(3)9,
12(3)11,
12(4)15,
13(2)8,
13(4)16
- processing,
3(1)1,
3(4)213,
4(4)375,
5(2)121,
5(4)291,
6(2)7,
6(3)9,
6(3)10,
6(4)3,
7(1)1,
7(1)3,
7(2)7,
7(4)13,
8(1)2,
8(2)9,
8(4)13,
8(4)16,
8(4)18,
8(4)19,
9(2)5,
9(2)6,
9(3)11,
9(4)15,
10(3)11,
10(3)14,
10(4)20,
11(1)2,
11(3)9,
11(4)15,
12(1)3,
12(3)10,
13(1)1,
13(2)7
- progress,
9(4)15,
10(3)14
- property,
6(2)7,
8(3)11,
9(2)6,
11(3)9
- proposed,
5(2)121,
5(2)165,
6(2)7,
7(1)1,
7(1)2,
7(3)9,
7(3)10,
7(4)11,
7(4)13,
8(1)4,
8(2)6,
8(3)10,
8(3)11,
8(4)19,
9(1)1,
9(2)5,
9(2)7,
10(2)7,
10(2)9,
10(3)14,
10(4)18,
11(1)3,
11(2)5,
11(2)6,
11(2)7,
11(3)8,
11(3)9,
11(3)10,
11(3)11,
11(4)16,
11(4)17,
12(1)4,
12(2)5,
12(2)7,
12(3)12,
12(4)16,
12(4)17,
13(2)6,
13(2)8,
13(3)13,
13(4)18
- purpose,
11(3)10
- representation,
1(3)207,
6(2)7,
8(2)7,
8(3)12,
11(4)15,
13(2)9
- researchers,
9(2)7,
11(1)1,
11(1)2,
11(3)8,
11(4)15,
13(1)3
- result,
4(2)135,
5(2)121,
5(2)146,
5(2)165,
6(2)6,
6(2)7,
6(3)9,
6(3)11,
6(4)3,
7(1)2,
7(2)5,
7(2)6,
7(2)7,
7(3)8,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(1)2,
8(1)3,
8(1)4,
8(2)6,
8(2)9,
8(3)10,
8(3)12,
8(4)15,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
9(1)1,
9(1)2,
9(2)5,
9(2)6,
9(2)7,
9(3)11,
9(3)12,
9(4)14,
10(1)2,
10(2)7,
11(2)4,
11(2)5,
11(3)8,
11(3)9,
11(3)11,
11(4)13,
11(4)14,
11(4)15,
12(1)3,
12(1)4,
12(2)5,
12(2)7,
12(3)9,
12(3)10,
12(3)11,
12(4)14,
12(4)16,
13(1)1,
13(1)4,
13(2)6,
13(2)7,
13(2)9,
13(3)11,
13(3)12,
13(3)14
- script,
1(4)297,
6(2)8,
7(4)11,
8(3)11,
11(1)1,
12(2)6,
12(3)9,
13(2)6
- section,
5(3)183
- short,
8(3)10,
8(3)12,
12(1)2
- significance,
11(2)6,
13(3)11,
13(3)13
- solution,
6(3)10,
8(2)9,
8(3)12,
8(4)19,
9(3)11,
12(1)2,
12(2)5,
12(2)6
- specific,
7(2)7,
8(2)7,
11(4)15,
11(4)17,
12(1)3,
12(1)4,
12(2)6
- speech,
1(1)83,
4(1)38,
6(3)9,
7(1)2,
7(3)10,
8(1)2,
8(1)4,
8(4)18,
9(1)2,
9(2)7,
10(1)6,
10(2)7,
11(1)2,
11(3)10,
13(4)16
- standard,
6(3)10,
7(4)11,
8(4)15,
8(4)18,
9(1)1,
9(2)5,
9(2)6,
10(3)12,
11(2)5,
11(4)18,
13(2)7,
13(3)13,
13(4)17
- such,
7(2)7,
7(3)8,
7(3)10,
7(4)12,
8(2)8,
8(3)10,
8(3)11,
8(3)12,
8(4)16,
8(4)17,
9(1)1,
9(3)12,
9(4)13,
9(4)15,
10(1)5,
10(2)8,
10(3)12,
10(4)21,
11(1)2,
11(2)5,
11(2)7,
11(3)8,
11(3)10,
11(3)11,
11(4)13,
11(4)16,
11(4)17,
11(4)18,
12(1)1,
12(1)2,
12(2)6,
12(3)10,
12(3)11,
12(4)14,
12(4)17,
13(1)1,
13(3)12,
13(4)17
- text,
1(1)34,
1(2)159,
3(3)190,
3(4)215,
4(1)38,
4(2)135,
4(4)435,
5(1)1,
5(2)165,
6(1)z-3,
6(3)10,
6(4)2,
7(2)6,
7(3)8,
7(3)9,
8(1)4,
8(3)11,
8(4)16,
8(4)18,
9(1)1,
9(3)10,
9(4)15,
10(3)14,
11(1)2,
11(2)4,
11(2)5,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)17,
11(4)18,
12(1)2,
12(1)3,
12(2)6,
12(3)11,
12(4)15,
13(1)1,
13(1)4,
13(2)7,
13(2)8,
13(2)9,
13(2)10,
13(3)14
- then,
5(2)121,
6(2)6,
7(1)1,
7(3)10,
7(4)12,
8(1)4,
8(2)7,
8(3)10,
8(3)11,
8(3)12,
9(1)1,
9(2)7,
9(3)11,
10(2)7,
10(3)13,
10(4)20,
11(1)3,
11(2)7,
11(3)11,
11(4)15,
12(1)3,
12(3)10,
12(4)17,
13(1)4,
13(2)9,
13(3)13,
13(4)16
- today,
9(4)14
- way,
5(2)89,
6(2)7,
8(3)12,
9(2)5,
10(4)17
- which,
5(2)89,
5(2)121,
6(2)6,
6(2)8,
6(3)10,
6(4)1,
7(1)3,
7(2)7,
7(3)10,
7(4)13,
8(1)2,
8(1)4,
8(2)9,
8(3)10,
8(3)12,
8(4)16,
8(4)18,
9(1)1,
9(2)5,
9(3)12,
9(4)14,
9(4)15,
10(1)4,
10(1)6,
10(2)7,
10(2)8,
10(2)9,
10(3)12,
10(3)13,
10(3)14,
10(3)15,
10(4)17,
10(4)19,
10(4)20,
11(2)6,
11(3)8,
11(3)9,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)18,
12(1)1,
12(1)3,
12(1)4,
12(2)5,
12(2)6,
12(2)7,
12(3)10,
12(3)11,
12(4)15,
12(4)17,
13(1)1,
13(2)8,
13(3)13,
13(4)17,
13(4)18
- would,
9(2)7,
9(3)11,
10(1)5,
12(3)9,
12(3)11