-
Notifications
You must be signed in to change notification settings - Fork 9
/
refs.bib
236 lines (207 loc) · 10.8 KB
/
refs.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
%% About CODA: unified guidelines and resources for Arabic dialect orthography (LREC 2018).
%% Authors use "Last, First" form so the two-word surname "Al shargi" is not split.
@inproceedings{Habash2018unified,
  author    = {Habash, Nizar and Eryani, Fadhl and Khalifa, Salam and Rambow, Owen and
               Abdulrahim, Dana and Erdmann, Alexander and Faraj, Reem and Zaghouani, Wajdi and
               Bouamor, Houda and Zalmout, Nasser and Hassan, Sara and {Al shargi}, Faisal and
               Alkhereyf, Sakhar and Abdulkareem, Basma and Eskander, Ramy and
               Salameh, Mohammad and Saddiki, Hind},
  title     = {Unified Guidelines and Resources for {A}rabic Dialect Orthography},
  booktitle = {Proceedings of the Language Resources and Evaluation Conference (LREC)},
  address   = {Miyazaki, Japan},
  year      = {2018},
  url       = {https://www.aclweb.org/anthology/L18-1574.pdf},
}
%% About CODA: conventional orthography for Tunisian Arabic (LREC 2014).
@inproceedings{Zribi2014conventional,
  author    = {Zribi, Ines and Boujelbane, Rahma and Masmoudi, Abir and
               Ellouze, Mariem and Belguith, Lamia and Habash, Nizar},
  title     = {A Conventional Orthography for {T}unisian {A}rabic},
  booktitle = {Proceedings of the Language Resources and Evaluation Conference (LREC)},
  address   = {Reykjavik, Iceland},
  year      = {2014},
  url       = {http://www.lrec-conf.org/proceedings/lrec2014/pdf/219_Paper.pdf},
}
%% About CODA: conventional orthography for Maghrebi Arabic (LREC 2016).
%% Only the proper nouns in the title are brace-protected, matching the sibling entries.
@inproceedings{Turki2016conventional,
  author        = {Turki, Houcemeddine and Adel, Emad and Daouda, Tariq and Regragui, Nassim},
  title         = {A Conventional Orthography for {M}aghrebi {A}rabic},
  booktitle     = {Proceedings of the Language Resources and Evaluation Conference (LREC)},
  address       = {Portoro{\v{z}}, Slovenia},
  year          = {2016},
  url           = {https://www.researchgate.net/profile/Houcemeddine_Turki/publication/311589181_A_Conventional_Orthography_for_Maghrebi_Arabic/links/584fd40608ae4bc8993b35ae.pdf},
  date-modified = {2018-09-28 14:31:37 +0400},
}
%% About CODA: Palestinian Arabic conventional orthography guidelines (technical report, 2015).
@techreport{Habash2015palestinian,
  author      = {Habash, Nizar and Jarrar, Mustafa and Alrimawi, Faeq and Akra, Diyam and
                 Zalmout, Nasser and Bartolotti, Eric and Arar, Mahdi},
  title       = {Palestinian {A}rabic Conventional Orthography Guidelines},
  institution = {Birzeit University and New York University Abu Dhabi},
  year        = {2015},
  url         = {http://www.jarrar.info/publications/HR15.pdf},
}
%% About CODA: conventional orthography for Algerian Arabic (WANLP 2015).
%% Only the proper nouns in the title are brace-protected, matching the sibling entries.
@inproceedings{Saadane2015conventional,
  author    = {Saadane, Houda and Habash, Nizar},
  title     = {A Conventional Orthography for {A}lgerian {A}rabic},
  booktitle = {Proceedings of the Workshop for {A}rabic Natural Language Processing (WANLP)},
  address   = {Beijing, China},
  pages     = {69},
  year      = {2015},
  url       = {https://www.aclweb.org/anthology/W15-3208.pdf},
}
%% About CODA: the original conventional orthography for dialectal Arabic (LREC 2012).
%% The initial capitals spelling out the acronym stay protected; the redundant outer braces are gone.
@inproceedings{Habash2012conventional,
  author    = {Habash, Nizar and Diab, Mona and Rambow, Owen},
  title     = {{C}onventional {O}rthography for {D}ialectal {A}rabic},
  booktitle = {Proceedings of the Language Resources and Evaluation Conference (LREC)},
  address   = {Istanbul, Turkey},
  pages     = {711--718},
  year      = {2012},
  url       = {http://www.lrec-conf.org/proceedings/lrec2012/pdf/579_Paper.pdf},
}
%% About CODA: version 0.1 of the CODA specification (Columbia technical report CCLS-11-02).
%% Only the proper noun and the acronym in the title are brace-protected.
@techreport{Habash2011conventional,
  author      = {Habash, Nizar and Diab, Mona and Rambow, Owen},
  title       = {Conventional Orthography for Dialectal {A}rabic ({CODA}) Version 0.1},
  institution = {Columbia University Center for Computational Learning Systems},
  number      = {CCLS-11-02},
  year        = {2011},
  url         = {https://academiccommons.columbia.edu/doi/10.7916/D8V69SG2/download},
}
%% About CODA (brief mention): survey of Arabic NLP.
%% The DOI is stored bare (no resolver prefix) and the percent sign in the abstract is escaped
%% so the field is safe when a style writes it into the .bbl.
@article{Guellil2019arabic,
  author   = {Guellil, Imane and Sa{\^a}dane, Houda and Azouaou, Faical and Gueni, Billel and Nouvel, Damien},
  title    = {{A}rabic Natural Language Processing: An Overview},
  journal  = {Journal of King Saud University - Computer and Information Sciences},
  year     = {2019},
  issn     = {1319-1578},
  doi      = {10.1016/j.jksuci.2019.02.006},
  url      = {http://www.sciencedirect.com/science/article/pii/S1319157818310553},
  keywords = {Arabic, MSA, AD, CA, Arabizi, Basic analysis, Identification, Building Resources, Machine translation, Sentiment analysis, Transliteration},
  abstract = {Arabic is recognised as the 4th most used language of the Internet. Arabic has three main varieties: (1) classical Arabic (CA), (2) Modern Standard Arabic (MSA), (3) Arabic Dialect (AD). MSA and AD could be written either in Arabic or in Roman script (Arabizi), which corresponds to Arabic written with Latin letters, numerals and punctuation. Due to the complexity of this language and the number of corresponding challenges for NLP, many surveys have been conducted, in order to synthesise the work done on Arabic. However these surveys principally focus on two varieties of Arabic (MSA and AD, written in Arabic letters only), they are slightly old (no such survey since 2015) and therefore do not cover recent resources and tools. To bridge the gap, we propose a survey focusing on 90 recent research papers (74\% of which were published after 2015). Our study presents and classifies the work done on the three varieties of Arabic, by concentrating on both Arabic and Arabizi, and associates each work to its publicly available resources whenever available.},
}
%% Using CODA: morphological disambiguation for dialectal Arabic (NAACL 2018).
@inproceedings{Zalmout2018noiserobust,
  author    = {Zalmout, Nasser and Erdmann, Alexander and Habash, Nizar},
  title     = {Noise-Robust Morphological Disambiguation for Dialectal {A}rabic},
  booktitle = {Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics (NAACL)},
  address   = {New Orleans, Louisiana, USA},
  year      = {2018},
  url       = {https://www.aclweb.org/anthology/N18-1087.pdf},
}
%% Using CODA: noise in multidialectal word embeddings (ACL 2018).
@inproceedings{Erdmann2018addressing,
  author    = {Erdmann, Alexander and Zalmout, Nasser and Habash, Nizar},
  title     = {Addressing Noise in Multidialectal Word Embeddings},
  booktitle = {Proceedings of the Conference of the Association for Computational Linguistics (ACL)},
  address   = {Melbourne, Australia},
  year      = {2018},
  url       = {https://www.aclweb.org/anthology/P18-2089.pdf},
}
%% Using CODA: SUAR, a corpus for the Saudi dialect (ACLing 2018).
%% Authors use "Last, First" form so the two-part surname "Bin Huwaymil" is kept together;
%% in "First Last" form a tie (~) does not attach "Bin" to the last name.
@inproceedings{AlTwairesh2018suar,
  author        = {Al-Twairesh, Nora and Al-Matham, Rawan and Madi, Nora and Almugren, Nada and
                   Al-Aljmi, Al-Hanouf and Alshalan, Shahad and Alshalan, Raghad and
                   Alrumayyan, Nafla and Al-Manea, Shams and Bawazeer, Sumayah and
                   Al-Mutlaq, Nourah and Almanea, Nada and Bin~Huwaymil, Waad and
                   Alqusair, Dalal and Alotaibi, Reem and Al-Senaydi, Suha and Alfutamani, Abeer},
  title         = {{SUAR}: Towards Building a Corpus for the {S}audi Dialect},
  booktitle     = {Proceedings of the International Conference on {A}rabic Computational Linguistics (ACLing)},
  year          = {2018},
  url           = {http://fac.ksu.edu.sa/sites/default/files/suar.pdf},
  date-added    = {2018-10-11 21:38:15 +0400},
  date-modified = {2018-10-11 21:42:03 +0400},
}
%% Using CODA: joint diacritization, lemmatization, normalization and tagging (arXiv preprint, 2019).
%% The arXiv identifier is stored in eprint/archiveprefix rather than in a journal field.
@misc{Zalmout2019joint,
  author        = {Zalmout, Nasser and Habash, Nizar},
  title         = {Joint Diacritization, Lemmatization, Normalization, and Fine-Grained Morphological Tagging},
  year          = {2019},
  eprint        = {1910.02267},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/1910.02267},
}
%% Using CODA: TArC, a Tunisian arabish corpus.
%% The url points at the LREC 2020 proceedings, so the entry is recorded as a conference paper;
%% the arXiv identifier is kept in eprint/archiveprefix.
@inproceedings{Gugliotta2020tarc,
  author        = {Gugliotta, Elisa and Dinarelli, Marco},
  title         = {{TArC}: Incrementally and Semi-Automatically Collecting a {T}unisian arabish Corpus},
  booktitle     = {Proceedings of the Language Resources and Evaluation Conference (LREC)},
  address       = {Marseille, France},
  year          = {2020},
  eprint        = {2003.09520},
  archiveprefix = {arXiv},
  url           = {http://www.lrec-conf.org/proceedings/lrec2020/pdf/2020.lrec-1.770.pdf},
}
%% Using CODA: targeted topic modeling for Levantine Arabic (2020).
@misc{Zahra2020targeted,
  author = {Zahra, Shorouq},
  title  = {Targeted Topic Modeling for {L}evantine {A}rabic},
  year   = {2020},
  url    = {https://www.diva-portal.org/smash/get/diva2:1439483/FULLTEXT01.pdf},
}
%% Using CODA: part-of-speech tagging for Arabic tweets (Computer Speech & Language, 2020).
%% The url is the canonical article address, without the per-session access token.
@article{Alkhwiter2020partofspeech,
  author    = {AlKhwiter, Wasan and Al-Twairesh, Nora},
  title     = {Part-of-Speech Tagging for {A}rabic Tweets Using {CRF} and {Bi-LSTM}},
  journal   = {Computer Speech \& Language},
  volume    = {65},
  pages     = {101138},
  year      = {2020},
  publisher = {Elsevier},
  url       = {https://www.sciencedirect.com/science/article/pii/S0885230820300711},
}
%% Using CODA: PhD thesis on morphological tagging and disambiguation in dialectal Arabic (2020).
%% The url omits the referrer query parameters, which also removes a raw ampersand.
@phdthesis{zalmout2020morphological,
  author = {Zalmout, Nasser},
  title  = {Morphological Tagging and Disambiguation in Dialectal {A}rabic Using Deep Learning Architectures},
  school = {New York University Tandon School of Engineering},
  year   = {2020},
  url    = {https://search.proquest.com/docview/2385667717},
}
%% Using CODA: AraPI transcription convention for spoken Arabic corpora (HAL document, 2019).
%% Recorded as @misc because no journal is known; the title carries no trailing period
%% because bibliography styles add their own.
@misc{Choueiri2019transcription,
  author = {Choueiri, Lina and Dimachki, Loubna and Pinon, Catherine and Traverso, V{\'e}ronique},
  title  = {Transcription de Corpus Oraux d'Arabe Parl{\'e} en Interaction. {C}onvention {AraPI} et Annexes},
  year   = {2019},
  url    = {https://hal.archives-ouvertes.fr/hal-02153116/document},
}
%% Using CODA: LearnPalestinianArabic.com writing-system page (archived copy).
%% There is no author, so `key` supplies the sort/label fallback; the site name goes in
%% howpublished because @misc has no journal field.
@misc{learnpalestinianarabic2016,
  key          = {LearnPalestinianArabic},
  title        = {Learn {P}alestinian {A}rabic, the Spoken Dialect of {P}alestine},
  howpublished = {LearnPalestinianArabic.com},
  year         = {2016},
  url          = {https://web.archive.org/web/20200223170950/http://www.learnpalestinianarabic.com/writingsystem.html},
}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%% CATiB citations: the Columbia Arabic Treebank (ACL-IJCNLP 2009 short paper).
%% The acronym and proper nouns are brace-protected so styles cannot lower-case them.
@inproceedings{habash2009catib,
  author    = {Habash, Nizar and Roth, Ryan},
  title     = {{CATiB}: The {C}olumbia {A}rabic Treebank},
  booktitle = {Proceedings of the {ACL-IJCNLP} 2009 Conference Short Papers},
  pages     = {221--224},
  year      = {2009},
  url       = {https://www.aclweb.org/anthology/P09-2056.pdf},
}
%% CATiB citations: syntactic annotation in the Columbia Arabic Treebank (MEDAR 2009).
%% The venue city is in `address`, as in the other conference entries of this file.
@inproceedings{habash2009syntactic,
  author    = {Habash, Nizar and Faraj, Reem and Roth, Ryan},
  title     = {Syntactic Annotation in the {C}olumbia {A}rabic Treebank},
  booktitle = {Proceedings of {MEDAR} International Conference on {A}rabic Language Resources and Tools},
  address   = {Cairo, Egypt},
  year      = {2009},
  url       = {http://www.elda.org/medar-conference/pdf/25.pdf},
}
%% CATiB citations: an Arabic dependency treebank in the travel domain (arXiv preprint, 2019).
%% The arXiv identifier is stored in eprint/archiveprefix rather than in a journal field,
%% and the surname "El Gizuli" is kept together.
@misc{taji2019arabic,
  author        = {Taji, Dima and El Gizuli, Jamila and Habash, Nizar},
  title         = {An {A}rabic Dependency Treebank in the Travel Domain},
  year          = {2019},
  eprint        = {1901.10188},
  archiveprefix = {arXiv},
  url           = {http://lrec-conf.org/workshops/lrec2018/W30/pdf/14_W30.pdf},
}
%% CATiB citations: CamelParser system demonstration (COLING 2016).
%% The system name and the conference acronym are brace-protected to keep their casing.
@inproceedings{shahrour2016camelparser,
  author    = {Shahrour, Anas and Khalifa, Salam and Taji, Dima and Habash, Nizar},
  title     = {{CamelParser}: A System for {A}rabic Syntactic Analysis and Morphological Disambiguation},
  booktitle = {Proceedings of {COLING} 2016, the 26th International Conference on Computational Linguistics: System Demonstrations},
  pages     = {228--232},
  year      = {2016},
  url       = {https://www.aclweb.org/anthology/C16-2048.pdf},
}
%% CATiB citations: Arabic diacritization through syntactic analysis (EMNLP 2015).
@inproceedings{shahrour2015improving,
  author    = {Shahrour, Anas and Khalifa, Salam and Habash, Nizar},
  title     = {Improving {A}rabic Diacritization through Syntactic Analysis},
  booktitle = {Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing},
  year      = {2015},
  pages     = {1309--1315},
  url       = {https://www.aclweb.org/anthology/D15-1152.pdf},
}
%% CATiB citations: dependency parsing of Modern Standard Arabic (Computational Linguistics, 2013).
%% The title is in Title Case with the proper nouns brace-protected; the DOI is taken
%% from the article URL and stored bare.
@article{marton2013dependency,
  author    = {Marton, Yuval and Habash, Nizar and Rambow, Owen},
  title     = {Dependency Parsing of {M}odern {S}tandard {A}rabic with Lexical and Inflectional Features},
  journal   = {Computational Linguistics},
  volume    = {39},
  number    = {1},
  pages     = {161--194},
  year      = {2013},
  publisher = {MIT Press},
  doi       = {10.1162/COLI_a_00138},
  url       = {https://www.mitpressjournals.org/doi/full/10.1162/COLI_a_00138},
}