diff --git a/corpora/historical-corpora/CIPM.json b/corpora/historical-corpora/CIPM.json new file mode 100644 index 0000000..8261914 --- /dev/null +++ b/corpora/historical-corpora/CIPM.json @@ -0,0 +1,16 @@ +{ + "Name": "CIPM", + "URL": "https://hdl.handle.net/21.11129/0000-000D-F934-0", + "Family": "Historical corpora", + "Description": "This is a corpus of historical, religious, notarial, literary texts in prose and verse.\nThe corpus is available from PORTULAN.", + "Language": ["pt"], + "Licence": "CC-BY-NC-ND", + "Size": ["3.5 million words"], + "Annotation": ["", ""], + "Infrastructure": "CLARIN", + "Access": { + "Browse": "https://cipm.fcsh.unl.pt/", + "Download": "https://hdl.handle.net/21.11129/0000-000D-F934-0" + }, + "Publication":"" +} \ No newline at end of file diff --git a/corpora/historical-corpora/corpus-oudnederlands.json b/corpora/historical-corpora/corpus-oudnederlands.json new file mode 100644 index 0000000..4e5723f --- /dev/null +++ b/corpora/historical-corpora/corpus-oudnederlands.json @@ -0,0 +1,15 @@ +{ + "Name": "Corpus Oudnederlands (Corpus Old Dutch)", + "URL": "http://hdl.handle.net/10032/tm-a2-u6", + "Family": "Historical corpora", + "Description": "This is a corpus of all remaining Dutch word material from the year 475 to 1200 that served as the source material for the Oudnederlands Woordenboek (Dictionary of Old Dutch).\nThe corpus is available via the Dutch Language Institute.", + "Language": ["nl"], + "Licence": "", + "Size": [""], + "Annotation": ["", ""], + "Infrastructure": "CLARIN", + "Access": { + "Browse": "https://corpusoudnederlands.ivdnt.org/corpus-frontend/ONL/search/" + }, + "Publication":"" +} \ No newline at end of file diff --git a/corpora/historical-corpora/couranten-corpus.json b/corpora/historical-corpora/couranten-corpus.json new file mode 100644 index 0000000..34e7503 --- /dev/null +++ b/corpora/historical-corpora/couranten-corpus.json @@ -0,0 +1,15 @@ +{ + "Name": "Couranten Corpus", + "URL": 
"http://hdl.handle.net/10032/tm-a2-u9", + "Family": "Historical corpora", + "Description": "This is a corpus of 17th-century Dutch newspapers.\nThe corpus is available from the Dutch Language Institute.", + "Language": ["nl"], + "Licence": "", + "Size": [""], + "Annotation": ["", ""], + "Infrastructure": "CLARIN", + "Access": { + "Browse": "https://couranten.ivdnt.org/corpus-frontend/couranten/search/" + }, + "Publication":"" +} \ No newline at end of file diff --git a/corpora/historical-corpora/gekaapte-brieven.json b/corpora/historical-corpora/gekaapte-brieven.json new file mode 100644 index 0000000..4764215 --- /dev/null +++ b/corpora/historical-corpora/gekaapte-brieven.json @@ -0,0 +1,15 @@ +{ + "Name": "Gekaapte Brieven", + "URL": "http://hdl.handle.net/10032/tm-a2-x3", + "Family": "Historical corpora", + "Description": "This is a corpus of letters and other documents from the 17th and 18th centuries.\nThese letters and documents were present on Dutch ships hijacked by the English during one of the four wars fought between Britain and the Republic of the Seven United Netherlands during this period.\nThe corpus is available from the Dutch Language Institute.", + "Language": ["nl"], + "Licence": "", + "Size": [""], + "Annotation": ["", ""], + "Infrastructure": "CLARIN", + "Access": { + "Browse": "http://gekaaptebrieven.ivdnt.org/" + }, + "Publication":"" +} \ No newline at end of file diff --git a/corpora/historical-corpora/portuguese-parish-memories.json b/corpora/historical-corpora/portuguese-parish-memories.json new file mode 100644 index 0000000..6f45fa1 --- /dev/null +++ b/corpora/historical-corpora/portuguese-parish-memories.json @@ -0,0 +1,15 @@ +{ + "Name": "Portuguese Parish Memories (1758)", + "URL": "https://hdl.handle.net/21.11129/0000-000D-F8CE-4", + "Family": "Historical corpora", + "Description": "This is a corpus of historical surveys from the 18th century.\nThe corpus is available from PORTULAN.", + "Language": ["pt"], + "Licence": "CC BY", + 
"Size": [""], + "Annotation": ["", ""], + "Infrastructure": "CLARIN", + "Access": { + "Download": "https://hdl.handle.net/21.11129/0000-000D-F8CE-4" + }, + "Publication":"" +} \ No newline at end of file