NOTE(review): this patch was recovered from a whitespace-collapsed copy.
Blank context lines and the indentation of context lines in the hunks for
pre-existing files (papers_with_same_authors.py, plot_num_pc_per_area.py,
test/test_read.py) are reconstructed assumptions -- verify them against the
target files before applying. The "index" blob hashes are those of the
original commit and do not reflect the edited added lines.

diff --git a/examples/anonymise_submissions.py b/examples/anonymise_submissions.py
new file mode 100644
index 0000000..218f232
--- /dev/null
+++ b/examples/anonymise_submissions.py
@@ -0,0 +1,32 @@
+# Make file with anonymised submissions to share with sister conferences
+# (for dual-submission detection)
+# Ulle Endriss, 14 April 2024
+import os
+
+from easychair_extra.read import read_submission
+
+
+def main():
+    """Export the id, title and abstract of all submissions as CSV."""
+    current_dir = os.path.dirname(os.path.abspath(__file__))
+    root_dir = os.path.join(current_dir, "..", "easychair_sample_files")
+
+    # read the submission file
+    submissions = read_submission(
+        os.path.join(root_dir, "submission.csv"),
+        remove_deleted=True
+    )
+
+    # expose the "#" column under the name "id" in the exported file
+    submissions["id"] = submissions["#"]
+    submissions.to_csv(
+        "anonymised_submissions.csv",
+        sep=",",
+        encoding="utf-8",
+        columns=["id", "title", "abstract"],
+        index=False,
+    )
+
+
+if __name__ == "__main__":
+    main()
diff --git a/examples/papers_with_same_authors.py b/examples/papers_with_same_authors.py
index bc4ec78..c6758ca 100644
--- a/examples/papers_with_same_authors.py
+++ b/examples/papers_with_same_authors.py
@@ -2,7 +2,7 @@
 
 import pandas as pd
 
-from easychair_extra.read import read_submission, read_committee
+from easychair_extra.read import read_submission
 
 
 def main():
diff --git a/examples/papers_with_short_abstracts.py b/examples/papers_with_short_abstracts.py
new file mode 100644
index 0000000..b2b54b8
--- /dev/null
+++ b/examples/papers_with_short_abstracts.py
@@ -0,0 +1,32 @@
+# Help finding placeholder abstracts
+# Ulle Endriss, 14 April 2024
+import os
+
+from easychair_extra.read import read_submission
+
+
+def main():
+    """Export each submission's abstract together with its length as CSV."""
+    current_dir = os.path.dirname(os.path.abspath(__file__))
+    root_dir = os.path.join(current_dir, "..", "easychair_sample_files")
+
+    # read the submission file
+    submissions = read_submission(
+        os.path.join(root_dir, "submission.csv"),
+        remove_deleted=True
+    )
+    # vectorised length; a missing abstract counts as length 0 instead of
+    # making len() fail on a non-string value
+    submissions["abstract_len"] = submissions["abstract"].fillna("").str.len()
+
+    submissions.to_csv(
+        "abstract.csv",
+        sep=",",
+        encoding="utf-8",
+        columns=["#", "abstract_len", "abstract"],
+        index=False,
+    )
+
+
+if __name__ == "__main__":
+    main()
diff --git a/examples/plot_num_pc_per_area.py b/examples/plot_num_pc_per_area.py
index 494fc8a..d8eae64 100644
--- a/examples/plot_num_pc_per_area.py
+++ b/examples/plot_num_pc_per_area.py
@@ -1,7 +1,5 @@
-import pathlib
 from collections import Counter, defaultdict
 
-import csv
 import os.path
 
 import pandas as pd
diff --git a/test/test_read.py b/test/test_read.py
index c72740e..645597c 100644
--- a/test/test_read.py
+++ b/test/test_read.py
@@ -7,7 +7,8 @@
     authors_as_list,
     author_list_to_str,
     read_topics,
     read_committee,
+    read_author,
 )
 
 
@@ -132,3 +133,10 @@ def test_read_committee(self):
             for arg in arguments:
                 args[arg] = optional_arguments[arg]
             read_committee(os.path.join(root_dir, "committee.csv"), **args)
+
+    def test_read_author(self):
+        """Check that the sample author file is read without raising."""
+        current_dir = os.path.dirname(os.path.abspath(__file__))
+        root_dir = os.path.join(current_dir, "..", "easychair_sample_files")
+
+        read_author(os.path.join(root_dir, "author.csv"))