diff --git a/corpora/literary-corpora/bdcamoes-corpus-part-I.json b/corpora/literary-corpora/bdcamoes-corpus-part-I.json new file mode 100644 index 0000000..b3544d6 --- /dev/null +++ b/corpora/literary-corpora/bdcamoes-corpus-part-I.json @@ -0,0 +1,15 @@ +{ + "Name": "BDCamões Corpus (Part I)", + "URL": "https://hdl.handle.net/21.11129/0000-000D-F89B-D", + "Family": "Literary corpora", + "Description": "This corpus contains texts from 83 authors in 14 genres, covering a time span from the 15th to the 21st century, and adhering to different orthographic conventions.\nThe corpus is available from PORTULAN.", + "Language": ["pt"], + "Licence": "CC-BY", + "Size": ["3.1 million words"], + "Annotation": ["", ""], + "Infrastructure": "CLARIN", + "Access": { + "Download": "https://hdl.handle.net/21.11129/0000-000D-F89B-D" + }, + "Publication":"" +} \ No newline at end of file diff --git a/corpora/literary-corpora/bdcamoes-corpus-part-II.json b/corpora/literary-corpora/bdcamoes-corpus-part-II.json new file mode 100644 index 0000000..eb55c53 --- /dev/null +++ b/corpora/literary-corpora/bdcamoes-corpus-part-II.json @@ -0,0 +1,15 @@ +{ + "Name": "BDCamões Corpus (Part II)", + "URL": "https://hdl.handle.net/21.11129/0000-000D-F8AB-B", + "Family": "Literary corpora", + "Description": "This corpus contains texts from 83 authors in 14 genres, covering a time span from the 15th to the 21st century, and adhering to different orthographic conventions.\nThe corpus is available from PORTULAN.", + "Language": ["pt"], + "Licence": "MS-NC-NoReD-ND", + "Size": ["823,957 words"], + "Annotation": ["", ""], + "Infrastructure": "CLARIN", + "Access": { + "Download": "https://hdl.handle.net/21.11129/0000-000D-F8AB-B" + }, + "Publication":"" +} \ No newline at end of file diff --git a/corpora/literary-corpora/digiliblt.json b/corpora/literary-corpora/digiliblt.json new file mode 100644 index 0000000..9ac4822 --- /dev/null +++ b/corpora/literary-corpora/digiliblt.json @@ -0,0 +1,15 @@ +{ + "Name": "digilibLT", + "URL": "https://hdl.handle.net/20.500.11752/OPEN-554", + "Family": "Literary corpora", + "Description": "This is a corpus of secular prose texts written in the late antiquity.\nThe corpus is available from the ILC4CLARIN repository.", + "Language": ["la"], + "Licence": "CC BY-NC-SA 4.0", + "Size": ["375 texts"], + "Annotation": ["", ""], + "Infrastructure": "CLARIN", + "Access": { + "Download": "http://hdl.handle.net/20.500.11752/OPEN-554" + }, + "Publication":"" +} \ No newline at end of file diff --git a/corpora/literary-corpora/musisque.json b/corpora/literary-corpora/musisque.json new file mode 100644 index 0000000..eb55c53 --- /dev/null +++ b/corpora/literary-corpora/musisque.json @@ -0,0 +1,15 @@ +{ + "Name": "BDCamões Corpus (Part II)", + "URL": "https://hdl.handle.net/21.11129/0000-000D-F8AB-B", + "Family": "Literary corpora", + "Description": "This corpus contains texts from 83 authors in 14 genres, covering a time span from the 15th to the 21st century, and adhering to different orthographic conventions.\nThe corpus is available from PORTULAN.", + "Language": ["pt"], + "Licence": "MS-NC-NoReD-ND", + "Size": ["823,957 words"], + "Annotation": ["", ""], + "Infrastructure": "CLARIN", + "Access": { + "Download": "https://hdl.handle.net/21.11129/0000-000D-F8AB-B" + }, + "Publication":"" +} \ No newline at end of file