% bibliography.bib -- BibTeX reference database.
@inproceedings{ahmadi2024cordi,
  author    = {Ahmadi, Sina and Jaff, Daban Q. and Alam, Md Mahfuz Ibn and Anastasopoulos, Antonios},
  title     = {Language and Speech Technology for {Central Kurdish} Varieties},
  booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)},
  month     = may,
  year      = {2024},
  address   = {Torino, Italy},
  publisher = {ELRA and ICCL}
}
% LDC speech dataset (catalog item), cited as a dataset rather than a proceedings paper.
@misc{delgado2024kaset,
  author       = {Delgado, Dana and Walker, Kevin and Strassel, Stephanie and Graff, David and Caruso, Christopher},
  title        = {{KASET} -- {Kurmanji} and {Sorani} {Kurdish} Speech and Transcripts},
  howpublished = {Linguistic Data Consortium, Philadelphia},
  note         = {LDC2024S01},
  year         = {2024},
  doi          = {10.35111/576n-ye16},
  url          = {https://doi.org/10.35111/576n-ye16}
}
@inproceedings{ahmadi2023script,
  author    = {Ahmadi, Sina and Anastasopoulos, Antonios},
  editor    = {Rogers, Anna and Boyd-Graber, Jordan and Okazaki, Naoaki},
  title     = {Script Normalization for Unconventional Writing of Under-Resourced Languages in Bilingual Communities},
  booktitle = {Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)},
  pages     = {14466--14487},
  month     = jul,
  year      = {2023},
  address   = {Toronto, Canada},
  publisher = {Association for Computational Linguistics},
  doi       = {10.18653/v1/2023.acl-long.809},
  url       = {https://aclanthology.org/2023.acl-long.809}
}
@article{alam2023codet,
  author  = {Alam, Md Mahfuz Ibn and Ahmadi, Sina and Anastasopoulos, Antonios},
  title   = {{CODET}: A Benchmark for Contrastive Dialectal Evaluation of Machine Translation},
  journal = {arXiv preprint arXiv:2305.17267},
  year    = {2023}
}
@inproceedings{ahmadi2023revisiting,
  author    = {Ahmadi, Sina and Mahmudi, Aso},
  editor    = {Nicolai, Garrett and Chodroff, Eleanor and Mailhot, Frederic and {\c{C}}{\"o}ltekin, {\c{C}}a{\u{g}}r{\i}},
  title     = {Revisiting and Amending {C}entral {K}urdish Data on {U}ni{M}orph 4.0},
  booktitle = {Proceedings of the 20th SIGMORPHON workshop on Computational Research in Phonetics, Phonology, and Morphology},
  pages     = {38--48},
  month     = jul,
  year      = {2023},
  address   = {Toronto, Canada},
  publisher = {Association for Computational Linguistics},
  doi       = {10.18653/v1/2023.sigmorphon-1.5},
  url       = {https://aclanthology.org/2023.sigmorphon-1.5}
}
% The host conference is kept in eventtitle; publisher now names the actual publisher.
@inproceedings{ahmadi2023fieldmatters,
  author     = {Ahmadi, Sina and Azin, Zahra and Belelli, Sara and Anastasopoulos, Antonios},
  title      = {Approaches to Corpus Creation for Low-Resource Language Technology: the Case of {Southern Kurdish} and {Laki}},
  booktitle  = {Proceedings of the Second Workshop on NLP Applications to Field Linguistics},
  eventtitle = {The 17th Conference of the European Chapter of the Association for Computational Linguistics},
  month      = may,
  year       = {2023},
  address    = {Dubrovnik, Croatia},
  publisher  = {Association for Computational Linguistics}
}
% The host conference is kept in eventtitle; publisher now names the actual publisher.
@inproceedings{ahmadi2023pali,
  author     = {Ahmadi, Sina and Agarwal, Milind and Anastasopoulos, Antonios},
  title      = {{PALI}: A Language Identification Benchmark for {Perso-Arabic} Scripts},
  booktitle  = {Proceedings of the 10th Workshop on NLP for Similar Languages, Varieties and Dialects (VarDial)},
  eventtitle = {The 17th Conference of the European Chapter of the Association for Computational Linguistics},
  month      = may,
  year       = {2023},
  address    = {Dubrovnik, Croatia},
  publisher  = {Association for Computational Linguistics}
}
@article{hameed2023sentiment,
  title     = {Transfer Learning for Low-Resource Sentiment Analysis},
  author    = {Hameed, Razhan and Ahmadi, Sina and Daneshfar, Fatemeh},
  journal   = {ACM Trans. Asian Low-Resour. Lang. Inf. Process.},
  publisher = {Association for Computing Machinery},
  year      = {2023},
  note      = {Under review},
  abstract  = {Sentiment analysis is the process of identifying and extracting subjective information from text. Despite the advances to employ cross-lingual approaches in an automatic way, the implementation and evaluation of sentiment analysis systems require language-specific data to consider various sociocultural and linguistic peculiarities. In this paper, the collection and annotation of a dataset are described for sentiment analysis of Central Kurdish. We explore a few classical machine learning and neural network-based techniques for this task. Additionally, we employ an approach in transfer learning to leverage pretrained models for data augmentation. We demonstrate that data augmentation achieves a high F1 score and accuracy despite the difficulty of the task.}
}
@article{abdullah2022,
  author  = {Abdullah, Abdulhady and Veisi, Hadi},
  title   = {{Central Kurdish} Automatic Speech Recognition using Deep Learning},
  journal = {Journal of University of Anbar for Pure Science},
  volume  = {16},
  pages   = {108--118},
  month   = dec,
  year    = {2022},
  doi     = {10.37652/juaps.2022.176500}
}
@article{awlla2022,
  author  = {Awlla, Kozhin and Veisi, Hadi},
  title   = {{Central Kurdish} Sentiment Analysis Using Deep Learning},
  journal = {Journal of University of Anbar for Pure Science},
  volume  = {16},
  pages   = {119--130},
  month   = dec,
  year    = {2022},
  doi     = {10.37652/juaps.2022.176501}
}
@article{amin2022kurdish,
  author  = {Amin, Miran Hama Saeed Mohammed and Al-Rassam, Omar and Faeq, Zhenar Shaho},
  title   = {Kurdish Language Sentiment Analysis: Problems and Challenges},
  journal = {Mathematical Statistician and Engineering Applications},
  volume  = {71},
  number  = {4},
  pages   = {3282--3293},
  year    = {2022}
}
% NOTE(review): the original entry had no title; the title below was supplied
% for arXiv 2111.11063 and should be confirmed against the arXiv record.
@misc{zuhair2021,
  author        = {Zuhair, Aza and Hassani, Hossein},
  title         = {Comparing the Accuracy of Deep Neural Networks ({DNN}) and Convolutional Neural Network ({CNN}) in Music Genre Recognition ({MGR}): Experiments on {Kurdish} Music},
  year          = {2021},
  publisher     = {arXiv},
  eprint        = {2111.11063},
  archivePrefix = {arXiv},
  doi           = {10.48550/ARXIV.2111.11063},
  url           = {https://arxiv.org/abs/2111.11063},
  copyright     = {Creative Commons Attribution 4.0 International}
}
% NOTE(review): this article entry has no journal field, which BibTeX requires
% for this entry type -- add it once the venue is confirmed.
@article{kamala2022kurdish,
  author    = {Kamala, Aza and Hassani, Hossein},
  title     = {Kurdish Music Genre Recognition Using CNN and DNN},
  publisher = {MDPI},
  year      = {2022}
}
@inproceedings{ahmadi2021ickl,
  author    = {Ahmadi, Sina},
  title     = {On the Current State of {Kurdish} Language Processing},
  booktitle = {Proceedings of the 5th International Conference on Kurdish Linguistics (ICKL-5)},
  address   = {Graz, Austria},
  year      = {2021}
}
@article{app11209752,
  author         = {Idrees, Saman and Hassani, Hossein},
  title          = {Exploiting Script Similarities to Compensate for the Large Amount of Data in Training {Tesseract} {LSTM}: Towards {Kurdish} {OCR}},
  journal        = {Applied Sciences},
  volume         = {11},
  number         = {20},
  article-number = {9752},
  year           = {2021},
  issn           = {2076-3417},
  doi            = {10.3390/app11209752},
  url            = {https://www.mdpi.com/2076-3417/11/20/9752}
}
@inproceedings{azin2021sk,
  author    = {Azin, Zahra and Ahmadi, Sina},
  title     = {Creating an Electronic Lexicon for the Under-resourced {Southern} Varieties of {Kurdish} Language},
  booktitle = {Proceedings of the Seventh Biennial Conference on Electronic Lexicography (eLex 2021)},
  address   = {Online},
  year      = {2021}
}
@inproceedings{abdulrahman2022lmspell,
  author    = {Abdulrahman, Roshna Omer and Hassani, Hossein},
  title     = {A Language Model for Spell Checking of Educational Texts in {Kurdish} ({Sorani})},
  booktitle = {Proceedings of SIGUL2022 LREC2022},
  month     = jun,
  year      = {2022},
  address   = {Marseille, France},
  publisher = {European Language Resources Association (ELRA)},
  url       = {http://www.lrec-conf.org/proceedings/lrec2022/workshops/SIGUL/pdf/2022.sigul-1.25.pdf}
}
@article{ahmadi2020Hunspell,
  author  = {Ahmadi, Sina},
  title   = {{Hunspell} for {Sorani} {Kurdish} Spell Checking and Morphological Analysis},
  journal = {arXiv preprint arXiv:2109.06374},
  year    = {2021}
}
@misc{naserzade2021ckmorph,
  author        = {Naserzade, Morteza and Mahmudi, Aso and Veisi, Hadi and Hosseini, Hawre and MohammadAmini, Mohammad},
  title         = {{CKMorph}: A Comprehensive Morphological Analyzer for {Central Kurdish}},
  year          = {2021},
  eprint        = {2109.08615},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL}
}
@article{ahmadi2021modelling,
  author  = {Ahmadi, Sina},
  title   = {A Formal Description of {Sorani} {Kurdish} Morphology},
  journal = {arXiv preprint arXiv:2109.03942},
  year    = {2021}
}
@article{de2021multilingual,
  author  = {De Cao, Nicola and Wu, Ledell and Popat, Kashyap and Artetxe, Mikel and Goyal, Naman and Plekhanov, Mikhail and Zettlemoyer, Luke and Cancedda, Nicola and Riedel, Sebastian and Petroni, Fabio},
  title   = {Multilingual Autoregressive Entity Linking},
  journal = {arXiv preprint arXiv:2103.12528},
  year    = {2021}
}
@inproceedings{ahmadi-2020-building,
  author    = {Ahmadi, Sina},
  title     = {Building a Corpus for the {Zaza--Gorani} Language Family},
  booktitle = {Proceedings of the 7th Workshop on NLP for Similar Languages, Varieties and Dialects},
  pages     = {70--78},
  month     = dec,
  year      = {2020},
  address   = {Barcelona, Spain (Online)},
  publisher = {International Committee on Computational Linguistics (ICCL)},
  url       = {https://www.aclweb.org/anthology/2020.vardial-1.7}
}
@misc{veisi2021jira,
  author        = {Veisi, Hadi and Hosseini, Hawre and Mohammadamini, Mohammad and Fathy, Wirya and Mahmudi, Aso},
  title         = {{Jira}: a {Kurdish} Speech Recognition System Designing and Building Speech Corpus and Pronunciation Lexicon},
  year          = {2021},
  eprint        = {2102.07412},
  archivePrefix = {arXiv},
  primaryClass  = {cs.AI}
}
@inproceedings{ahmadi-2020-tokenization,
  author    = {Ahmadi, Sina},
  title     = {A Tokenization System for the {K}urdish Language},
  booktitle = {Proceedings of the 7th Workshop on NLP for Similar Languages, Varieties and Dialects},
  pages     = {114--127},
  month     = dec,
  year      = {2020},
  address   = {Barcelona, Spain (Online)},
  publisher = {International Committee on Computational Linguistics (ICCL)},
  url       = {https://www.aclweb.org/anthology/2020.vardial-1.11}
}
@inproceedings{ahmadi-2020-klpt,
  author    = {Ahmadi, Sina},
  title     = {{KLPT} {--} {K}urdish Language Processing Toolkit},
  booktitle = {Proceedings of Second Workshop for NLP Open Source Software (NLP-OSS)},
  pages     = {72--84},
  month     = nov,
  year      = {2020},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  doi       = {10.18653/v1/2020.nlposs-1.11},
  url       = {https://www.aclweb.org/anthology/2020.nlposs-1.11}
}
@misc{mahmudi2021automatic,
  author        = {Mahmudi, Aso and Veisi, Hadi},
  title         = {Automatic Meter Classification of {Kurdish} Poems},
  year          = {2021},
  eprint        = {2102.12109},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL}
}
@inproceedings{ahmadi2020machine,
  author    = {Ahmadi, Sina and Masoud, Maraim},
  title     = {Towards Machine Translation for the {K}urdish Language},
  booktitle = {Proceedings of the 3rd Workshop on Technologies for MT of Low Resource Languages},
  pages     = {87--98},
  month     = dec,
  year      = {2020},
  address   = {Suzhou, China},
  publisher = {Association for Computational Linguistics},
  url       = {https://www.aclweb.org/anthology/2020.loresmt-1.12}
}
@article{ahmadi2022leveraging,
  author     = {Ahmadi, Sina and Hassani, Hossein and Jaff, Daban Q.},
  title      = {Leveraging Multilingual News Websites for Building a {Kurdish} Parallel Corpus},
  journal    = {ACM Transactions on Asian and Low-Resource Language Information Processing},
  volume     = {21},
  number     = {5},
  articleno  = {99},
  numpages   = {11},
  month      = apr,
  year       = {2022},
  issue_date = {September 2022},
  publisher  = {Association for Computing Machinery},
  address    = {New York, NY, USA},
  issn       = {2375-4699},
  doi        = {10.1145/3511806},
  url        = {https://doi.org/10.1145/3511806},
  keywords   = {Parallel corpus, natural language processing, Kurdish, machine translation, less-resourced languages}
}
@inproceedings{mohammed2012automatic,
  author       = {Mohammed, F. S. and Zakaria, L. and Omar, Nazlia and Albared, M. Y.},
  title        = {Automatic {Kurdish} {Sorani} text categorization using N-gram based model},
  booktitle    = {Computer \& Information Science (ICCIS), 2012 International Conference on},
  volume       = {1},
  pages        = {392--395},
  year         = {2012},
  organization = {IEEE}
}
@inproceedings{esmaili2013sorani,
  author    = {Esmaili, Kyumars Sheykh and Salavati, Shahin},
  title     = {{Sorani} {Kurdish} versus {Kurmanji} {Kurdish}: An Empirical Comparison},
  booktitle = {Proceedings of the 51st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)},
  volume    = {2},
  pages     = {300--305},
  year      = {2013}
}
@article{hassani2016automatic,
  author  = {Hassani, Hossein and Medjedovic, Dzejla},
  title   = {Automatic {K}urdish dialects identification},
  journal = {Computer Science \& Information Technology},
  volume  = {6},
  number  = {2},
  pages   = {61--78},
  year    = {2016}
}
@inproceedings{malmasi2016subdialectal,
  author    = {Malmasi, Shervin},
  title     = {Subdialectal differences in {Sorani} {Kurdish}},
  booktitle = {Proceedings of the Third Workshop on NLP for Similar Languages, Varieties and Dialects (VarDial3)},
  pages     = {89--96},
  year      = {2016}
}
@article{al2017kurdish,
  author    = {Al-Talabani, Abdulbasit and Abdul, Zrar and Ameen, Azad},
  title     = {{K}urdish Dialects and Neighbor Languages Automatic Recognition},
  journal   = {ARO-The Scientific Journal of Koya University},
  volume    = {5},
  number    = {1},
  pages     = {20--23},
  year      = {2017},
  publisher = {Koya University}
}
@inproceedings{littell2016named,
  author    = {Littell, Patrick and Goyal, Kartik and Mortensen, David R and Little, Alexa and Dyer, Chris and Levin, Lori},
  title     = {Named entity recognition for linguistic rapid response in low-resource languages: {S}orani {K}urdish and {T}ajik},
  booktitle = {Proceedings of COLING 2016, the 26th International Conference on Computational Linguistics: Technical Papers},
  pages     = {998--1006},
  year      = {2016}
}
@inproceedings{hassani2017method,
  author       = {Hassani, Hossein},
  title        = {A Method for Proper Noun Extraction in {K}urdish},
  booktitle    = {OASIcs-OpenAccess Series in Informatics},
  volume       = {56},
  year         = {2017},
  organization = {Schloss Dagstuhl-Leibniz-Zentrum fuer Informatik}
}
@article{esmaili2012challenges,
  author  = {Esmaili, Kyumars Sheykh},
  title   = {Challenges in {K}urdish text processing},
  journal = {arXiv preprint arXiv:1212.0074},
  year    = {2012}
}
% NOTE(review): the citation key below looks garbled (possibly meant to be
% esmaili2014towards); it is left unchanged because documents may cite it.
@article{esmaAl-Talabaniili2014towards,
  author    = {Esmaili, Kyumars Sheykh and Salavati, Shahin and Datta, Anwitaman},
  title     = {Towards {K}urdish information retrieval},
  journal   = {ACM Transactions on Asian Language Information Processing (TALIP)},
  volume    = {13},
  number    = {2},
  pages     = {7},
  year      = {2014},
  publisher = {ACM}
}
@inproceedings{jaf2016simple,
  author       = {Jaf, Sardar},
  title        = {A simple approach to unify ambiguously encoded {Kurdish} characters},
  booktitle    = {Proceedings of the International Conference Computational Linguistics in Bulgaria (CLIB 2016)},
  pages        = {86--94},
  year         = {2016},
  organization = {Institute for Bulgarian Language, Bulgarian Academy of Sciences}
}
@article{rashid2017robust,
  author  = {Rashid, Tarik A and Mustafa, Arazo M and Saeed, Ari M},
  title   = {A robust categorization system for {Kurdish} {Sorani} text documents},
  journal = {Information Technology Journal},
  volume  = {16},
  number  = {1},
  pages   = {27--34},
  year    = {2017}
}
@article{ahmadi2019wergor,
  author  = {Ahmadi, Sina},
  title   = {A Rule-based {Kurdish} Text Transliteration System},
  journal = {ACM Transactions on Asian and Low-Resource Language Information Processing (TALLIP)},
  volume  = {18},
  number  = {2},
  pages   = {18:1--18:8},
  year    = {2019}
}
@inproceedings{rashid2017automatic,
  author       = {Rashid, Tarik A and Mustafa, Arazo M and Saeed, Ari M},
  title        = {Automatic {Kurdish} Text Classification Using {KDC} 4007 Dataset},
  booktitle    = {International Conference on Emerging Internetworking, Data \& Web Technologies},
  pages        = {187--198},
  year         = {2017},
  organization = {Springer}
}
@inproceedings{daneshfar2009implementation,
  author       = {Daneshfar, Fatemeh and Barkhoda, Wafa and Azami, Bahram Zahir},
  title        = {Implementation of a Text-to-Speech System for {Kurdish} Language},
  booktitle    = {Digital Telecommunications, 2009. ICDT'09. Fourth International Conference on},
  pages        = {117--120},
  year         = {2009},
  organization = {IEEE}
}
@inproceedings{barkhoda2009comparison,
  author       = {Barkhoda, Wafa and Azami, Bahram Zahir and Bahrampour, Anvar and Shahryari, Om-Kolsoom},
  title        = {A comparison between allophone, syllable, and diphone based {TTS} systems for {Kurdish} language},
  booktitle    = {Signal Processing and Information Technology (ISSPIT), 2009 IEEE International Symposium on},
  pages        = {557--562},
  year         = {2009},
  organization = {IEEE}
}
@article{hassani2011kurdish,
  author  = {Hassani, Hossein and Kareem, Rahel},
  title   = {{Kurdish} text to speech ({KTTS})},
  journal = {Designing for Global Markets},
  volume  = {10},
  pages   = {79--89},
  year    = {2011}
}
@inproceedings{bahrampour2009implementation,
  author       = {Bahrampour, Anvar and Barkhoda, Wafa and Azami, Bahram Zahir},
  title        = {Implementation of three text to speech systems for {Kurdish} language},
  booktitle    = {Iberoamerican Congress on Pattern Recognition},
  pages        = {321--328},
  year         = {2009},
  organization = {Springer}
}
@inproceedings{dinler2017formant,
  author       = {D{\.i}nler, {\"O}zlem Batur and Karab{\i}ber, Fatih},
  title        = {Formant analysis of vowels in {K}urdish language},
  booktitle    = {Signal Processing and Communications Applications Conference (SIU), 2017 25th},
  pages        = {1--4},
  year         = {2017},
  organization = {IEEE}
}
@article{dinler2018extraction,
  author  = {D{\.i}nler, {\"O}zlem Batur and Aydin, Nizamettin},
  title   = {Extraction Of The Acoustic Features Of Semi-vowels In the {Kurdish} Language},
  journal = {The Online Journal of Science and Technology},
  volume  = {8},
  number  = {2},
  month   = apr,
  year    = {2018}
}
@inproceedings{hassani2017kurdish,
  author    = {Hassani, Hossein},
  title     = {{K}urdish interdialect machine translation},
  booktitle = {Proceedings of the fourth workshop on NLP for similar languages, varieties and dialects (VarDial)},
  pages     = {63--72},
  year      = {2017}
}
@article{kaka2018english,
  author  = {Kaka-Khan, Kanaan M},
  title   = {{English} to {Kurdish} Rule-based Machine Translation System},
  journal = {UHD Journal of Science and Technology},
  year    = {2018}
}
@article{saeed2018improving,
  author  = {Saeed, Ari M and Rashid, Tarik A and Mustafa, Arazo M and Fattah, Polla and Ismael, Birzo},
  title   = {Improving {Kurdish} Web Mining through Tree Data Structure and {Porter's} Stemmer Algorithms},
  journal = {UKH Journal of Science and Engineering},
  volume  = {2},
  number  = {1},
  pages   = {48--54},
  year    = {2018}
}
@inproceedings{salavati2013stemming,
  author       = {Salavati, Shahin and Esmaili, Kyumars Sheykh and Akhlaghian, Fardin},
  title        = {Stemming for {Kurdish} information retrieval},
  booktitle    = {Asia Information Retrieval Symposium},
  pages        = {272--283},
  year         = {2013},
  organization = {Springer}
}
@inproceedings{gokirmak2017dependency,
  author    = {G{\"o}k{\i}rmak, Memduh and Tyers, Francis M},
  title     = {A dependency treebank for {K}urmanji {K}urdish},
  booktitle = {Proceedings of the Fourth International Conference on Dependency Linguistics (Depling 2017)},
  pages     = {64--72},
  year      = {2017}
}
@inproceedings{salavati2018building,
  author    = {Salavati, Shahin and Ahmadi, Sina},
  title     = {Building a Lemmatizer and a Spell-checker for {Sorani} {Kurdish}},
  booktitle = {Proceedings of the 8th Language \& Technology Conference: Human Language Technologies as a Challenge for Computer Science and Linguistics},
  address   = {Pozna{\'n}, Poland},
  year      = {2018}
}
@inproceedings{walther2010developing,
  author    = {Walther, G{\'e}raldine and Sagot, Beno{\^\i}t},
  title     = {Developing a large-scale lexicon for a less-resourced language: General methodology and preliminary experiments on {S}orani {K}urdish},
  booktitle = {Proceedings of the 7th SaLTMiL Workshop on Creation and use of basic lexical resources for less-resourced languages (LREC 2010 Workshop)},
  year      = {2010}
}
@inproceedings{walther2010fast,
  author    = {Walther, G{\'e}raldine and Sagot, Beno{\^\i}t and Fort, Kar{\"e}n},
  title     = {Fast Development of Basic {NLP} Tools: Towards a Lexicon and a {POS} Tagger for {Kurmanji} {Kurdish}},
  booktitle = {International conference on lexis and grammar},
  year      = {2010}
}
@inproceedings{walther2012fitting,
  author    = {Walther, G{\'e}raldine},
  title     = {Fitting into morphological structure: accounting for {Sorani} {Kurdish} endoclitics},
  booktitle = {Mediterranean Morphology Meetings},
  volume    = {8},
  pages     = {299--321},
  year      = {2012},
  url       = {http://www.lilec.it/mmm/wp/wp-content/uploads/2013/09/299-321-Walther.pdf},
  note      = {[Online; accessed 19-Mar-2019]}
}
@inproceedings{jaf2014stemmer,
  author    = {Jaf, Sardar and Ramsay, Allan},
  title     = {A Stemmer and a {POS} tagger for {Sorani} {Kurdish}},
  booktitle = {6th International Conference on Corpus Linguistics (CILC-14)},
  year      = {2014},
  address   = {Gran Canaria, Spain},
  publisher = {Cambridge Scholars}
}
@article{mustafa2018kurdish,
  author    = {Mustafa, Arazo M and Rashid, Tarik A},
  title     = {{Kurdish} stemmer pre-processing steps for improving information retrieval},
  journal   = {Journal of Information Science},
  volume    = {44},
  number    = {1},
  pages     = {15--27},
  year      = {2018},
  publisher = {SAGE Publications},
  address   = {London, England}
}
@inproceedings{esmaili2013building,
  author       = {Esmaili, Kyumars Sheykh and Eliassi, Donya and Salavati, Shahin and Aliabadi, Purya and Mohammadi, Asrin and Yosefi, Somayeh and Hakimi, Shownem},
  title        = {Building a test collection for {S}orani {K}urdish},
  booktitle    = {Computer Systems and Applications (AICCSA), 2013 ACS International Conference on},
  pages        = {1--7},
  year         = {2013},
  organization = {IEEE}
}
@inproceedings{aliabadi2014towards,
  author    = {Aliabadi, Purya and Ahmadi, Mohammad Sina and Salavati, Shahin and Esmaili, Kyumars Sheykh},
  title     = {Towards building {KurdNet}, the {Kurdish} {WordNet}},
  booktitle = {Proceedings of the Seventh Global Wordnet Conference},
  pages     = {1--6},
  year      = {2014}
}
@inproceedings{aliabadi2014semi,
  author    = {Aliabadi, Purya},
  title     = {Semi-Automatic Development of {KurdNet}, The {Kurdish} {WordNet}},
  booktitle = {Proceedings of the ACL 2014 Student Research Workshop},
  pages     = {94--99},
  year      = {2014}
}
@article{veisi2020toward,
  author    = {Veisi, Hadi and MohammadAmini, Mohammad and Hosseini, Hawre},
  title     = {Toward {Kurdish} language processing: Experiments in collecting and processing the {AsoSoft} text corpus},
  journal   = {Digital Scholarship in the Humanities},
  volume    = {35},
  number    = {1},
  pages     = {176--193},
  year      = {2020},
  publisher = {Oxford University Press}
}
% Removed a second, identical definition of the key hassani2016automatic
% (already defined earlier in this file); repeated keys make BibTeX report "repeated entry".
% Removed a second, identical definition of the key malmasi2016subdialectal
% (already defined earlier in this file); repeated keys make BibTeX report "repeated entry".
% Removed a second, identical definition of the key mohammed2012automatic
% (already defined earlier in this file); repeated keys make BibTeX report "repeated entry".
@article{hassani2018blark,
  author    = {Hassani, Hossein},
  title     = {{BLARK} for multi-dialect languages: towards the {Kurdish} {BLARK}},
  journal   = {Language Resources and Evaluation},
  volume    = {52},
  number    = {2},
  pages     = {625--644},
  year      = {2018},
  publisher = {Springer}
}
@article{yaseen2018kurdish,
  author  = {Yaseen, Rasty and Hassani, Hossein},
  title   = {{K}urdish Optical Character Recognition},
  journal = {UKH Journal of Science and Engineering},
  volume  = {2},
  number  = {1},
  pages   = {18--27},
  year    = {2018}
}
% NOTE(review): the journal value "Volume" looks like an export artifact rather
% than a real journal name -- confirm and correct.
@article{mohammed2013handwritten,
  author  = {Mohammed, Bayan Omar},
  title   = {Handwritten {K}urdish character recognition using geometric discertization feature},
  journal = {Volume},
  volume  = {4},
  pages   = {51--55},
  year    = {2013}
}
@article{dinler2018kurdish,
  author  = {D{\.i}nler, {\"O}zlem Batur and Aydin, Nizamettin},
  title   = {{K}urdish Recognition System Digit},
  journal = {The Online Journal of Science and Technology},
  volume  = {8},
  number  = {1},
  pages   = {101},
  year    = {2018}
}
@article{mohammed2012uniqueness,
  author  = {Mohammed, Bayan Omar},
  title   = {Uniqueness in {K}urdish handwriting},
  journal = {International Journal of Engineering \& Computer Science IJECS-IJENS},
  volume  = {12},
  number  = {06},
  pages   = {42--50},
  year    = {2012}
}
@article{zarro2017recognition,
  author    = {Zarro, Rina D and Anwer, Mardin A},
  title     = {Recognition-based online {K}urdish character recognition using hidden {M}arkov model and harmony search},
  journal   = {Engineering Science and Technology, an International Journal},
  volume    = {20},
  number    = {2},
  pages     = {783--794},
  year      = {2017},
  publisher = {Elsevier}
}
@article{shaltookisentiment,
  author  = {Shaltooki, Abdusalam Abdulla and Hama, Mzhda Hiwa},
  title   = {Sentiment Analyses for {K}urdish Social Network Texts using {N}aive {B}ayes Classifier},
  journal = {Journal of Human Development},
  volume  = {1},
  number  = {4},
  pages   = {393--397},
  year    = {2016}
}
@article{hashim2018kurdish,
  author  = {Hashim, Abdulla D and Alizadeh, Fattah},
  title   = {{K}urdish Sign Language Recognition System},
  journal = {UKH Journal of Science and Engineering},
  volume  = {2},
  number  = {1},
  pages   = {1--6},
  year    = {2018}
}
@article{kaka2017building,
  author  = {Kaka-Khan, Kanaan M},
  title   = {Building {K}urdish Chatbot Using Free Open Source Platforms},
  journal = {UHD Journal of Science and Technology},
  volume  = {1},
  number  = {2},
  pages   = {46--50},
  year    = {2017}
}
@inproceedings{gautier1998building,
  author    = {Gautier, G{\'e}rard},
  title     = {Building a {Kurdish} Language Corpus: An Overview of the Technical Problems},
  booktitle = {Proceedings of ICEMCO},
  year      = {1998}
}
@article{kakaevaluation,
  author  = {Kaka-Khan, Kanaan M and Taher, Fatima Jalal},
  title   = {Evaluation of inkurdish Machine Translation System},
  journal = {{UHD Journal of Science and Technology}},
  volume  = {3},
  number  = {2},
  pages   = {862--868},
  year    = {2017}
}
% Same paper as the entry keyed ahmadi-2020-tokenization; this key is kept so
% existing citations still resolve, with the publication details aligned to that entry.
@inproceedings{ahmadi2020tokenization,
  author    = {Ahmadi, Sina},
  title     = {A Tokenization System for the {Kurdish} Language},
  booktitle = {Proceedings of the 7th Workshop on NLP for Similar Languages, Varieties and Dialects},
  pages     = {114--127},
  month     = dec,
  year      = {2020},
  address   = {Barcelona, Spain (Online)},
  publisher = {International Committee on Computational Linguistics (ICCL)},
  url       = {https://www.aclweb.org/anthology/2020.vardial-1.11}
}
% Removed a second definition of the key ahmadi2020Hunspell: it only carried an
% "under review" placeholder, and the same key is already defined earlier in this
% file with the arXiv reference. Repeated keys make BibTeX report "repeated entry".
% No venue is recorded for this manuscript, so it is typed as unpublished.
@unpublished{ahmadi2020lemmatization,
  author = {Ahmadi, Sina},
  title  = {A Lemmatization System for {Sorani} {Kurdish}},
  note   = {Under review},
  year   = {2020}
}
@article{ahmadi2020towards,
  author  = {Ahmadi, Sina and Hassani, Hossein},
  title   = {Towards Finite-State Morphology of {Kurdish}},
  journal = {arXiv preprint arXiv:2005.10652},
  year    = {2020}
}
@inproceedings{ahmadi2020corpus,
  author    = {Ahmadi, Sina and Hassani, Hossein and Abedi, Kamaladdin},
  title     = {A corpus of the {Sorani} {Kurdish} folkloric lyrics},
  booktitle = {Proceedings of the 1st Joint Spoken Language Technologies for Under-resourced languages (SLTU) and Collaboration and Computing for Under-Resourced Languages (CCURL) Workshop at the 12th International Conference on Language Resources and Evaluation (LREC)},
  year      = {2020}
}
@inproceedings{ahmadi2019towards,
  author       = {Ahmadi, Sina and Hassani, Hossein and McCrae, John P},
  title        = {Towards electronic lexicography for the {Kurdish} language},
  booktitle    = {Proceedings of the sixth biennial conference on electronic lexicography (eLex)},
  year         = {2019},
  organization = {eLex 2019}
}
@inproceedings{abdulrahman2019developing,
  author    = {Abdulrahman, Roshna and Hassani, Hossein and Ahmadi, Sina},
  title     = {Developing a Fine-grained Corpus for a Less-resourced Language: the case of {Kurdish}},
  booktitle = {Proceedings of the 2019 Workshop on Widening NLP},
  pages     = {106--109},
  year      = {2019}
}
@inproceedings{kamal-hassani-2020-towards,
  author    = {Kamal, Zina and Hassani, Hossein},
  title     = {Towards {K}urdish Text to Sign Translation},
  booktitle = {Proceedings of the LREC2020 9th Workshop on the Representation and Processing of Sign Languages: Sign Language Resources in the Service of the Language Community, Technological Challenges and Application Perspectives},
  pages     = {117--122},
  month     = may,
  year      = {2020},
  address   = {Marseille, France},
  publisher = {European Language Resources Association (ELRA)},
  url       = {https://www.aclweb.org/anthology/2020.signlang-1.19}
}
@article{abdulrahman2020using,
  author  = {Abdulrahman, Roshna Omer and Hassani, Hossein},
  title   = {Using {Punkt} for Sentence Segmentation in non-{Latin} Scripts: Experiments on {Kurdish} ({Sorani}) Texts},
  journal = {arXiv preprint arXiv:2004.14134},
  year    = {2020}
}
@article{saeed2018evaluation,
  author    = {Saeed, Ari M and Rashid, Tarik A and Mustafa, Arazo M and Agha, Rawan A Al-Rashid and Shamsaldin, Ahmed S and Al-Salihi, Nawzad K},
  title     = {An evaluation of {Reber} stemmer with longest match stemmer technique in {Kurdish} {Sorani} text classification},
  journal   = {Iran Journal of Computer Science},
  volume    = {1},
  number    = {2},
  pages     = {99--107},
  year      = {2018},
  publisher = {Springer}
}
@article{mahmudi2021automated,
  author    = {Mahmudi, Aso and Veisi, Hadi},
  title     = {Automated Grapheme-to-Phoneme Conversion for {Central Kurdish} based on {Optimality Theory}},
  journal   = {Computer Speech \& Language},
  pages     = {101222},
  year      = {2021},
  publisher = {Elsevier}
}
@article{baban1995programmable,
  author  = {Baban, S. T. and Husein, S.},
  title   = {Programmable Grammar of the {Kurdish} Language},
  journal = {ILLC Research Report and Technical Notes},
  year    = {1995}
}
@article{goyal2021flores,
  author  = {Goyal, Naman and Gao, Cynthia and Chaudhary, Vishrav and Chen, Peng-Jen and Wenzek, Guillaume and Ju, Da and Krishnan, Sanjana and Ranzato, Marc'Aurelio and Guzman, Francisco and Fan, Angela},
  title   = {The {FLORES-101} Evaluation Benchmark for Low-Resource and Multilingual Machine Translation},
  journal = {arXiv preprint arXiv:2106.03193},
  year    = {2021}
}
@article{ataman2018bianet,
  author  = {Ataman, Duygu},
  title   = {Bianet: A parallel news corpus in {Turkish}, {Kurdish} and {English}},
  journal = {arXiv preprint arXiv:1805.05095},
  year    = {2018}
}
@article{amini2021central,
  author  = {Amini, Zhila and Mohammadamini, Mohammad and Hosseini, Hawre and Mansouri, Mehran and Jaff, Daban},
  title   = {{Central Kurdish} machine translation: First large scale parallel corpus and experiments},
  journal = {arXiv preprint arXiv:2106.09325},
  year    = {2021}
}
@unpublished{amani:hal-03262435,
  author      = {Amani, Arash and Mohammadamini, Mohammad and Veisi, Hadi},
  title       = {{Kurdish} spoken dialect recognition using x-vector speaker embeddings},
  note        = {working paper or preprint},
  month       = jun,
  year        = {2021},
  url         = {https://hal.archives-ouvertes.fr/hal-03262435},
  keywords    = {Speaker embeddings ; x-vector ; Kurdish language ; dialect recognition ; Zar dataset},
  pdf         = {https://hal.archives-ouvertes.fr/hal-03262435/file/Kurdish%20spoken%20dialect%20recognition.pdf},
  hal_id      = {hal-03262435},
  hal_version = {v1}
}