Entry Yahya:2014:ATC from talip.bib
Last update: Sun Oct 15 02:55:04 MDT 2017
Top |
Symbols |
Numbers |
Math |
A |
B |
C |
D |
E |
F |
G |
H |
I |
J |
K |
L |
M |
N |
O |
P |
Q |
R |
S |
T |
U |
V |
W |
X |
Y |
Z
BibTeX entry
@Article{Yahya:2014:ATC,
author = "Adnan Yahya and Ali Salhi",
title = "{Arabic} Text Categorization Based on {Arabic
Wikipedia}",
journal = j-TALIP,
volume = "13",
number = "1",
pages = "4:1--4:??",
month = feb,
year = "2014",
CODEN = "????",
DOI = "https://doi.org/10.1145/2537129",
ISSN = "1530-0226 (print), 1558-3430 (electronic)",
ISSN-L = "1530-0226",
bibdate = "Thu Feb 27 12:18:55 MST 2014",
bibsource = "http://portal.acm.org/;
http://www.math.utah.edu/pub/tex/bib/talip.bib",
abstract = "This article describes an algorithm for categorizing
Arabic text, relying on highly categorized corpus-based
datasets obtained from the Arabic Wikipedia by using
manual and automated processes to build and customize
categories. The categorization algorithm was built by
adopting a simple categorization idea, then moving
forward to more complex ones. We applied tests and
filtration criteria to reach the best and most
efficient results that our algorithm can achieve. The
categorization depends on the statistical relations
between the input (test) text and the reference
(training) data supported by well-defined
Wikipedia-based categories. Our algorithm supports two
levels for categorizing Arabic text; categories are
grouped into a hierarchy of main categories and
subcategories. This introduces a challenge due to the
correlation between certain subcategories and overlap
between main categories. We argue that our algorithm
achieved good performance compared to other methods
reported in the literature.",
acknowledgement = ack-nhfb,
articleno = "4",
fjournal = "ACM Transactions on Asian Language Information
Processing",
journal-URL = "http://portal.acm.org/browse_dl.cfm?&idx=J820",
}
Related entries
- achieve,
7(3)9,
7(3)10,
7(4)12,
7(4)13,
8(1)4,
8(2)7,
8(3)10,
8(4)17,
9(2)6,
9(4)14,
10(2)7,
11(3)8,
11(3)11,
11(4)15,
11(4)17,
12(1)3,
12(1)4,
12(2)7,
12(3)9,
12(3)11,
13(1)3,
13(2)9
- achieved,
7(1)1,
7(2)7,
7(4)12,
7(4)13,
8(2)6,
11(4)13,
11(4)14,
12(2)5,
12(2)7
- algorithm,
1(4)281,
5(2)165,
6(3)11,
6(4)2,
6(4)3,
7(1)3,
7(2)7,
7(3)8,
7(3)10,
7(4)12,
8(1)4,
8(3)12,
9(1)3,
9(1)4,
10(2)7,
10(2)9,
10(2)10,
10(4)19,
11(1)3,
11(2)4,
11(2)7,
11(3)9,
11(3)11,
11(4)14,
12(1)1,
12(1)2,
12(2)6,
13(3)13,
13(4)18
- applied,
5(2)89,
5(2)121,
6(4)3,
8(4)19,
9(2)5,
9(3)11,
10(2)7,
13(2)10,
13(3)12,
13(4)16
- Arabic,
8(4)13,
8(4)14,
8(4)15,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
10(1)1,
10(1)2,
10(1)3,
10(1)4,
10(1)5,
11(1)2,
13(1)1,
13(2)9
- argue,
8(4)19,
11(2)6,
13(2)10
- article,
3(4)227,
4(3)321,
5(2)121,
6(2)6,
6(2)7,
6(2)8,
6(4)3,
7(1)1,
7(1)3,
7(2)5,
7(2)6,
7(2)7,
7(3)8,
7(3)9,
7(4)11,
7(4)12,
7(4)13,
8(1)2,
8(1)3,
8(1)4,
8(2)6,
8(2)8,
8(2)9,
8(3)10,
8(3)11,
8(3)12,
8(4)14,
8(4)16,
8(4)17,
8(4)18,
9(1)2,
9(1)4,
9(2)6,
9(3)10,
9(3)11,
9(3)12,
9(4)13,
9(4)14,
10(1)3,
10(1)5,
10(1)6,
10(2)7,
10(2)9,
10(2)10,
10(3)12,
10(3)13,
10(3)14,
10(3)15,
10(4)17,
10(4)18,
10(4)20,
10(4)21,
11(1)1,
11(2)4,
11(2)5,
11(2)7,
11(3)8,
11(3)10,
11(3)11,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)17,
11(4)18,
12(1)1,
12(1)3,
12(1)4,
12(2)5,
12(2)6,
12(2)7,
12(3)9,
12(3)10,
12(3)11,
12(3)12,
12(4)14,
13(1)1,
13(1)2,
13(1)3,
13(2)6,
13(2)7,
13(2)8,
13(2)9,
13(3)12,
13(3)13,
13(4)16
- automated,
7(4)13,
13(2)10
- based,
1(3)269,
2(4)301,
3(2)113,
4(3)357,
4(4)377,
5(2)121,
5(2)165,
5(3)185,
6(2)8,
6(3)9,
6(3)11,
6(4)3,
7(2)6,
7(3)10,
7(4)12,
8(1)4,
8(3)11,
8(3)12,
8(4)17,
8(4)19,
9(1)2,
9(2)5,
9(2)6,
9(2)7,
9(3)11,
10(1)4,
10(1)6,
10(2)7,
10(3)14,
10(3)16,
11(2)6,
11(3)8,
11(3)11,
11(4)14,
11(4)15,
11(4)16,
11(4)17,
11(4)18,
12(1)1,
12(1)2,
12(1)4,
12(3)9,
12(3)10,
12(3)11,
13(1)2,
13(1)3,
13(2)10,
13(3)13,
13(4)17,
13(4)18
- based, corpus-,
1(3)207,
5(2)89,
9(2)5,
9(3)12,
9(4)14
- best,
5(2)89,
5(3)183,
7(2)7,
7(4)13,
8(2)6,
9(1)3,
9(2)7,
9(3)11,
9(3)12,
11(3)8,
11(4)13,
12(1)2,
12(2)5,
12(2)7,
12(3)9,
12(4)14,
13(4)16
- build,
7(3)9,
8(2)9,
8(3)12,
13(1)3
- built,
8(2)9,
8(4)17,
11(4)15,
13(2)7
- categorization,
1(1)34,
3(3)190,
3(4)215
- categorized,
13(3)11
- category,
7(3)8,
10(1)4,
11(3)9
- certain,
9(3)11,
12(4)14
- challenge,
4(3)243,
6(3)10,
6(4)3,
8(1)4,
8(4)14,
8(4)18,
9(1)3,
10(3)12,
13(1)1,
13(2)8,
13(3)12,
13(4)17
- compared,
5(2)121,
6(3)9,
6(3)11,
8(4)16,
9(1)1,
9(3)11,
9(3)12,
10(4)17,
11(2)6,
12(1)2,
12(4)17,
13(1)2,
13(2)6,
13(3)12
- complex,
5(2)146,
7(1)1,
10(1)4,
10(2)8,
12(3)11,
13(2)8
- corpus-based,
1(3)207,
5(2)89,
9(2)5,
9(3)12,
9(4)14
- criteria,
11(2)4
- data,
2(2)143,
6(1)z,
6(1)z-1,
6(2)7,
6(3)11,
7(1)3,
7(3)9,
7(4)13,
8(1)3,
8(2)7,
8(3)10,
8(3)11,
8(3)12,
8(4)16,
8(4)18,
9(2)6,
10(2)7,
10(3)12,
10(4)20,
11(2)4,
11(3)10,
11(3)11,
11(4)13,
11(4)14,
11(4)18,
12(1)1,
12(2)7,
12(3)9,
13(1)2,
13(1)3,
13(4)16,
13(4)17,
13(4)18
- dataset,
7(4)12,
8(2)6,
9(3)10,
11(2)4,
11(4)18,
12(2)5,
12(3)10,
13(2)6
- depends,
7(1)1,
9(2)5
- describe,
6(3)9,
6(4)3,
7(2)5,
7(2)6,
7(2)7,
7(3)9,
7(4)12,
8(4)14,
9(3)10,
9(3)11,
10(1)5,
11(2)6,
12(1)3,
12(2)5,
13(1)1,
13(2)9
- due,
5(2)121,
6(2)8,
7(2)7,
9(1)1,
9(1)2,
9(4)15,
10(2)10,
10(3)12,
10(4)21,
11(2)7,
12(4)14,
13(4)17
- efficient,
2(1)63,
4(4)377,
11(2)4,
12(2)6,
12(3)12,
13(2)8,
13(4)17,
13(4)18
- good,
7(2)7,
9(2)5,
12(1)1,
12(3)12,
13(2)9
- grouped,
7(3)8
- hierarchy,
7(3)8
- highly,
5(2)121,
6(3)9,
6(4)2,
7(3)9,
8(4)18,
10(2)8,
10(4)20,
11(2)4,
12(2)5,
13(4)17
- idea,
8(3)12,
10(3)15,
11(2)6,
11(3)8
- input,
5(2)165,
8(2)7,
9(1)1,
9(1)3,
9(2)6,
10(1)6,
10(4)20,
12(1)2,
12(1)4,
12(2)6,
13(2)8,
13(3)12,
13(4)17
- introduce,
5(2)121,
7(4)11,
8(2)7,
8(3)12,
10(3)16,
12(3)9,
12(4)15,
13(1)3,
13(3)14
- level,
5(2)89,
8(4)15,
9(3)11,
10(3)12,
11(3)8,
12(3)9,
13(1)3,
13(3)12,
13(4)17
- literature,
5(1)22,
5(1)44,
11(2)7
- main,
6(3)9,
7(1)1,
7(1)2,
8(2)7,
8(3)12,
9(3)11,
11(3)8,
12(4)16
- manual,
8(1)3,
9(2)6
- more,
5(2)146,
6(2)7,
6(3)10,
7(3)9,
7(4)13,
8(1)4,
8(2)7,
8(3)12,
8(4)14,
8(4)16,
9(1)2,
9(2)6,
9(3)11,
9(3)12,
10(1)4,
10(4)19,
11(2)4,
11(2)7,
12(1)1,
12(1)2,
12(3)9,
13(1)1,
13(1)3,
13(2)8,
13(4)18
- most,
6(2)6,
7(1)1,
7(3)8,
7(3)10,
8(4)15,
9(1)1,
9(2)5,
9(3)11,
10(1)5,
10(2)8,
12(1)1,
12(1)2,
13(1)1,
13(2)6,
13(3)14,
13(4)18
- obtained,
6(3)9,
7(2)7,
8(2)9,
8(3)11,
8(4)17,
9(3)11,
11(4)16,
11(4)17,
12(3)10,
12(4)17
- one,
5(2)89,
5(2)121,
6(2)6,
6(3)9,
6(4)3,
7(3)8,
7(3)9,
7(4)11,
7(4)13,
8(2)9,
8(4)16,
8(4)17,
9(1)1,
9(2)5,
9(2)7,
9(3)12,
9(4)14,
10(1)5,
10(3)12,
10(3)13,
10(4)19,
11(2)4,
11(2)6,
11(2)7,
11(4)14,
12(1)1,
12(1)2,
12(2)5,
12(2)7,
12(3)11,
12(4)16,
13(2)10,
13(4)17,
13(4)18
- other,
5(2)165,
7(2)6,
7(2)7,
7(3)8,
7(4)11,
8(1)2,
8(2)7,
8(4)14,
8(4)16,
8(4)17,
9(1)1,
10(2)7,
10(4)20,
11(2)4,
11(2)7,
11(4)18,
12(1)1,
12(1)3,
12(3)11,
12(4)16,
13(1)3,
13(2)7
- overlap,
12(1)4
- performance,
5(2)121,
5(2)165,
6(2)8,
6(3)9,
6(4)1,
6(4)3,
7(1)1,
7(1)2,
7(2)5,
7(2)6,
7(2)7,
7(3)9,
7(3)10,
7(4)13,
8(1)2,
8(1)3,
8(2)7,
8(2)8,
8(2)9,
8(3)10,
8(4)16,
8(4)17,
8(4)18,
9(1)2,
9(1)4,
9(2)5,
9(2)6,
9(3)11,
9(3)12,
9(4)14,
10(2)8,
10(3)13,
10(3)14,
11(2)7,
11(3)10,
11(3)11,
11(4)14,
11(4)15,
11(4)17,
12(1)2,
12(3)9,
12(3)11,
12(4)14,
12(4)15,
12(4)16,
13(1)3,
13(2)7,
13(2)9,
13(4)16,
13(4)17
- process,
5(2)121,
6(2)6,
6(3)10,
7(1)1,
7(3)9,
10(2)10,
10(4)18,
12(3)9,
13(2)9
- reach,
12(1)1
- reference,
12(3)9
- relation,
1(3)173,
7(2)6,
7(4)12,
8(3)10,
9(2)7,
10(3)14,
10(3)15,
11(1)3,
11(3)11,
11(4)16,
11(4)18,
12(1)3,
13(1)2,
13(1)3
- relying,
8(2)7,
11(4)18
- reported,
7(4)13,
11(1)1,
11(1)2,
11(2)7,
13(2)6,
13(3)14
- result,
4(2)135,
5(2)121,
5(2)146,
5(2)165,
6(2)6,
6(2)7,
6(3)9,
6(3)11,
6(4)3,
7(1)2,
7(2)5,
7(2)6,
7(2)7,
7(3)8,
7(3)10,
7(4)11,
7(4)12,
7(4)13,
8(1)2,
8(1)3,
8(1)4,
8(2)6,
8(2)9,
8(3)10,
8(3)12,
8(4)14,
8(4)15,
8(4)16,
8(4)17,
8(4)18,
8(4)19,
9(1)1,
9(1)2,
9(2)5,
9(2)6,
9(2)7,
9(3)11,
9(3)12,
9(4)14,
10(1)2,
10(2)7,
11(2)4,
11(2)5,
11(3)8,
11(3)9,
11(3)11,
11(4)13,
11(4)14,
11(4)15,
12(1)3,
12(1)4,
12(2)5,
12(2)7,
12(3)9,
12(3)10,
12(3)11,
12(4)14,
12(4)16,
13(1)1,
13(2)6,
13(2)7,
13(2)9,
13(3)11,
13(3)12,
13(3)14
- simple,
9(2)5,
9(3)12,
10(4)18,
12(1)2,
12(3)9
- statistical,
1(1)3,
3(2)87,
3(4)243,
5(2)121,
5(4)323,
5(4)360,
6(1)z-4,
7(1)1,
8(1)2,
8(1)4,
8(2)6,
8(2)7,
8(2)8,
8(2)9,
8(3)10,
8(4)15,
8(4)19,
9(2)6,
9(2)7,
9(3)11,
10(4)18,
11(2)6,
11(2)7,
11(3)8,
11(4)15,
12(1)1,
12(3)12,
12(4)14,
12(4)16,
12(4)17,
13(1)2,
13(1)3,
13(4)17
- support,
6(4)3,
7(2)7,
7(3)8,
7(3)10,
12(2)6,
12(3)9,
13(4)18
- test,
6(2)6,
7(2)5,
9(1)3,
9(3)10,
9(3)11,
11(4)13,
12(3)9,
13(2)7,
13(3)13,
13(4)17
- text,
1(1)34,
1(2)159,
3(3)190,
3(4)215,
4(1)38,
4(2)135,
4(4)435,
5(1)1,
5(2)165,
6(1)z-3,
6(3)10,
6(4)2,
7(2)6,
7(3)8,
7(3)9,
8(1)4,
8(3)11,
8(4)14,
8(4)16,
8(4)18,
9(1)1,
9(3)10,
9(4)15,
10(3)14,
11(1)2,
11(2)4,
11(2)5,
11(4)13,
11(4)14,
11(4)15,
11(4)16,
11(4)17,
11(4)18,
12(1)2,
12(1)3,
12(2)6,
12(3)11,
12(4)15,
13(1)1,
13(2)7,
13(2)8,
13(2)9,
13(2)10,
13(3)14
- then,
5(2)121,
6(2)6,
7(1)1,
7(3)10,
7(4)12,
8(1)4,
8(2)7,
8(3)10,
8(3)11,
8(3)12,
8(4)14,
9(1)1,
9(2)7,
9(3)11,
10(2)7,
10(3)13,
10(4)20,
11(1)3,
11(2)7,
11(3)11,
11(4)15,
12(1)3,
12(3)10,
12(4)17,
13(2)9,
13(3)13,
13(4)16
- training,
5(2)121,
6(3)11,
7(1)1,
8(1)3,
8(2)6,
8(2)7,
8(3)10,
9(2)5,
10(3)12,
10(3)13,
11(3)9,
12(1)1,
12(2)5,
12(3)9,
12(3)10,
13(1)2,
13(1)3,
13(4)17
- two,
5(2)89,
7(2)7,
7(3)8,
7(4)11,
7(4)12,
7(4)13,
8(1)4,
8(2)7,
8(4)17,
9(1)2,
9(3)11,
9(4)13,
10(1)2,
10(3)12,
10(3)14,
10(3)15,
10(4)20,
11(2)4,
11(2)5,
11(2)7,
11(3)8,
11(3)9,
11(3)11,
11(4)17,
12(1)1,
12(1)2,
12(1)4,
12(2)5,
12(3)10,
12(3)11,
12(4)16,
13(1)1,
13(1)3,
13(2)6,
13(2)9,
13(3)11,
13(4)17
- was,
5(2)146,
6(3)9,
6(3)11,
8(4)18,
8(4)19,
9(2)7,
9(3)10,
10(4)18,
11(1)2,
11(3)10,
12(4)14,
13(4)16
- Wikipedia,
11(4)13,
11(4)16