Skip to content

Commit

Permalink
Version updates
Browse files Browse the repository at this point in the history
  • Loading branch information
dthoward96 committed Feb 23, 2024
1 parent 6d76293 commit 573e1a6
Show file tree
Hide file tree
Showing 93 changed files with 20,368 additions and 227 deletions.
35 changes: 35 additions & 0 deletions OTHER_species/config.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,35 @@
# Test submission configuration (placeholder credentials only).
# Nesting restored: without indentation the keys Username, Password,
# Submission_Position and Name collide at a single mapping level.
# NOTE(review): hierarchy is inferred from the generated submission.xml
# (Contact inside Organization) and authorset.sbt (email/phone inside affil);
# confirm against the tool's config template.
Submission:
  NCBI:
    # Placeholders; never commit real credentials.
    Username: username
    Password: password
    Table2asn: True
    Submission_Position: 1
    Description:
      Title: test_submission
      Comment: This is a test submission
      Organization:
        '@role': owner
        '@type': institute
        '@org_id': 12345
        Name: CDC
        Address:
          Affil: Centers for Disease Control and Prevention
          Div: Respiratory Viruses Branch, Division of Viral Diseases
          Street: 1600 Clifton Rd
          City: Atlanta
          Sub: GA
          Postal_code: 30329
          Country: USA
          # NOTE(review): address looks redacted in this copy; an unquoted value
          # starting with "[" parses as a YAML flow sequence. Supply a real,
          # quoted e-mail address.
          Email: [email protected]
          Phone: ""
        Submitter:
          # NOTE(review): same redaction caveat as Address.Email.
          '@email': [email protected]
          '@alt_email':
          Name:
            First: Jane
            Last: Doe
  GISAID:
    Client-Id: TEST-EA76875B00C3
    # Placeholders; never commit real credentials.
    Username: username
    Password: password
    Submission_Position: 2
3 changes: 3 additions & 0 deletions OTHER_species/metadata.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
ncbi-spuid,ncbi-spuid_namespace,bs-description,organism,ncbi-bioproject,bs-isolate,bs-collected_by,bs-package,bs-collection_date,bs-host,bs-host_disease,bs-isolation_source,bs-geo_loc_name,bs-lat_lon,bs-host_sex,bs-host_age,sra-file_location,sra-file_name,sra-library_name,sra-instrument_model,sra-library_strategy,sra-library_source,sra-library_selection,sra-library_layout,sra-library_construction_protocol,sra-loader,sequence_name,gb-subm_lab,gb-subm_lab_division,gb-subm_lab_addr,authors,gb-publication_status,gb-publication_title,gb-seq_id,src-isolate,collection_date,src-country,src-host,src-isolation_source,src-serotype,src-BioProject,src-BioSample,cmt-StructuredCommentPrefix,cmt-Assembly Method,cmt-Coverage,cmt-Sequencing Technology,cmt-StructuredCommentSuffix
seq1,CDC-OAMD,CDC Test,Monkeypox virus,PRJNA512913,MPXV/human/USA/GA_2741/2020,Helix,Pathogen.cl.1.0,3/28/2020,Homo sapiens,Monkeypox virus,nasal swab,United States: Georgia,Unknown,Male,28,local,"fastq_1_R1.fastq.gz, fastq_1_R2.fastq.gz",Other Test,Illumina NovaSeq 6000,AMPLICON,VIRAL RNA,RT-PCR,PAIRED,Helix Hybrid-Capture Test,latf-load,seq1,NIH,NCBI,"10 Center Dr, Bethesda, MD, USA 20895","Doe, John, R.; Doe, Jane;",unpublished,,MPXV/human/USA/GA_2741/2020,MPXV/human/USA/GA_2741/2020,3/28/2020,USA: GA,Homo sapiens,missing,Clade 1,PRJNA512913,SAMN02224951,Assembly-Data,Newbler v. 2.3,100x,Illumina ,Assembly-Data
seq2,CDC-OAMD,CDC Test,Monkeypox virus,PRJNA512962,MPXV/human/USA/GA_3742/2020,Helix,Pathogen.cl.1.0,4/29/2020,Homo sapiens,Monkeypox virus,nasal swab,United States: Georgia,Unknown,Male,45,,,,,,,,,,,seq2,NIH,NCBI,"10 Center Dr, Bethesda, MD, USA 20895","Doe, John; Doe, Jane;",unpublished,,MPXV/human/USA/GA_3742/2020,MPXV/human/USA/GA_3742/2020,4/29/2020,USA: GA,Homo sapiens,missing,Clade 1,PRJNA512962,SAMN02224986,Assembly-Data,Newbler v. 2.3,100x,Illumina,Assembly-Data
Binary file added OTHER_species/raw_reads/fastq_1_R1.fastq.gz
Binary file not shown.
Binary file added OTHER_species/raw_reads/fastq_1_R2.fastq.gz
Binary file not shown.
Binary file added OTHER_species/raw_reads/fastq_2_R1.fastq.gz
Binary file not shown.
Binary file added OTHER_species/raw_reads/fastq_2_R2.fastq.gz
Binary file not shown.
750 changes: 750 additions & 0 deletions OTHER_species/sequence.fasta

Large diffs are not rendered by default.

94 changes: 94 additions & 0 deletions OTHER_species/submission_files/BIOSAMPLE/submission.xml
Original file line number Diff line number Diff line change
@@ -0,0 +1,94 @@
<?xml version='1.0' encoding='utf-8'?>
<!--
  BioSample submission for two test samples (seq1, seq2); one <Action> per sample.
  Each sample carries exactly one collection_date attribute, in ISO 8601
  (YYYY-MM-DD) form. The duplicate locale-formatted value (M/D/YYYY) was removed:
  attribute names must be unique per sample and the date must be unambiguous.
-->
<Submission>
  <Description>
    <Title>test_submission</Title>
    <Comment>This is a test submission</Comment>
    <Organization type="institute" role="owner" org_id="12345">
      <Name>CDC</Name>
      <Contact email="[email protected]">
        <Name>
          <First>Jane</First>
          <Last>Doe</Last>
        </Name>
      </Contact>
    </Organization>
  </Description>
  <Action>
    <AddData target_db="BioSample">
      <Data content_type="xml">
        <XmlContent>
          <BioSample schema_version="2.0">
            <SampleId>
              <SPUID spuid_namespace="CDC-OAMD">seq1</SPUID>
            </SampleId>
            <Descriptor>
              <Title>CDC Test</Title>
            </Descriptor>
            <Organism>
              <OrganismName>Monkeypox virus</OrganismName>
            </Organism>
            <BioProject>
              <PrimaryId db="BioProject">PRJNA512913</PrimaryId>
            </BioProject>
            <Package>Pathogen.cl.1.0</Package>
            <Attributes>
              <Attribute attribute_name="isolate">MPXV/human/USA/GA_2741/2020</Attribute>
              <Attribute attribute_name="collected_by">Helix</Attribute>
              <Attribute attribute_name="host">Homo sapiens</Attribute>
              <Attribute attribute_name="host_disease">Monkeypox virus</Attribute>
              <Attribute attribute_name="isolation_source">nasal swab</Attribute>
              <Attribute attribute_name="geo_loc_name">United States: Georgia</Attribute>
              <Attribute attribute_name="lat_lon">Unknown</Attribute>
              <Attribute attribute_name="host_sex">Male</Attribute>
              <Attribute attribute_name="host_age">28</Attribute>
              <Attribute attribute_name="collection_date">2020-03-28</Attribute>
            </Attributes>
          </BioSample>
        </XmlContent>
      </Data>
      <Identifier>
        <SPUID spuid_namespace="CDC-OAMD_bs">seq1</SPUID>
      </Identifier>
    </AddData>
  </Action>
  <Action>
    <AddData target_db="BioSample">
      <Data content_type="xml">
        <XmlContent>
          <BioSample schema_version="2.0">
            <SampleId>
              <SPUID spuid_namespace="CDC-OAMD">seq2</SPUID>
            </SampleId>
            <Descriptor>
              <Title>CDC Test</Title>
            </Descriptor>
            <Organism>
              <OrganismName>Monkeypox virus</OrganismName>
            </Organism>
            <BioProject>
              <PrimaryId db="BioProject">PRJNA512962</PrimaryId>
            </BioProject>
            <Package>Pathogen.cl.1.0</Package>
            <Attributes>
              <Attribute attribute_name="isolate">MPXV/human/USA/GA_3742/2020</Attribute>
              <Attribute attribute_name="collected_by">Helix</Attribute>
              <Attribute attribute_name="host">Homo sapiens</Attribute>
              <Attribute attribute_name="host_disease">Monkeypox virus</Attribute>
              <Attribute attribute_name="isolation_source">nasal swab</Attribute>
              <Attribute attribute_name="geo_loc_name">United States: Georgia</Attribute>
              <Attribute attribute_name="lat_lon">Unknown</Attribute>
              <Attribute attribute_name="host_sex">Male</Attribute>
              <Attribute attribute_name="host_age">45</Attribute>
              <Attribute attribute_name="collection_date">2020-04-29</Attribute>
            </Attributes>
          </BioSample>
        </XmlContent>
      </Data>
      <Identifier>
        <SPUID spuid_namespace="CDC-OAMD_bs">seq2</SPUID>
      </Identifier>
    </AddData>
  </Action>
</Submission>
88 changes: 88 additions & 0 deletions OTHER_species/submission_files/GENBANK/authorset.sbt
Original file line number Diff line number Diff line change
@@ -0,0 +1,88 @@
Submit-block ::= {
  contact {
    contact {
      name name {
        last "Doe",
        first "Jane",
        middle "",
        initials "",
        suffix "",
        title ""
      },
      affil std {
        affil "Centers for Disease Control and Prevention",
        div "Respiratory Viruses Branch, Division of Viral Diseases",
        city "Atlanta",
        sub "GA",
        country "USA",
        street "1600 Clifton Rd",
        email "[email protected]",
        phone "",
        postal-code "30329"
      }
    }
  },
  cit {
    authors {
      names std {
        {
          name name {
            last "Doe",
            first "John",
            suffix "R."
          }
        },
        {
          name name {
            last "Doe",
            first "Jane"
          }
        }
      },
      affil std {
        affil "Centers for Disease Control and Prevention",
        div "Respiratory Viruses Branch, Division of Viral Diseases",
        city "Atlanta",
        sub "GA",
        country "USA",
        street "1600 Clifton Rd",
        postal-code "30329"
      }
    }
  },
  subtype new
}
Seqdesc ::= pub {
  pub {
    gen {
      cit "unpublished",
      authors {
        names std {
          {
            name name {
              last "Doe",
              first "John",
              suffix "R."
            }
          },
          {
            name name {
              last "Doe",
              first "Jane"
            }
          }
        }
      },
      title ""
    }
  }
}
Seqdesc ::= user {
  type str "Submission",
  data {
    {
      label str "AdditionalComment",
      data str "Submission Title: OTHER_species"
    }
  }
}
4 changes: 4 additions & 0 deletions OTHER_species/submission_files/SRA/raw_reads_location.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
/scicomp/home-pure/psv4/seqsender_dev/seqsender/OTHER_species/raw_reads/fastq_1_R1.fastq.gz
/scicomp/home-pure/psv4/seqsender_dev/seqsender/OTHER_species/raw_reads/fastq_2_R2.fastq.gz
/scicomp/home-pure/psv4/seqsender_dev/seqsender/OTHER_species/raw_reads/fastq_2_R1.fastq.gz
/scicomp/home-pure/psv4/seqsender_dev/seqsender/OTHER_species/raw_reads/fastq_1_R2.fastq.gz
78 changes: 78 additions & 0 deletions OTHER_species/submission_files/SRA/submission.xml
Original file line number Diff line number Diff line change
@@ -0,0 +1,78 @@
<?xml version='1.0' encoding='utf-8'?>
<!--
  SRA submission for two test samples (seq1, seq2).
  One <Action>/<AddFiles> per sample: two FASTQ files, the library attributes,
  and references to the sample's BioProject accession and BioSample SPUID.
-->
<Submission>
  <Description>
    <Title>test_submission</Title>
    <Comment>This is a test submission</Comment>
    <Organization type="institute" role="owner" org_id="12345">
      <Name>CDC</Name>
      <Contact email="[email protected]">
        <Name>
          <First>Jane</First>
          <Last>Doe</Last>
        </Name>
      </Contact>
    </Organization>
  </Description>
  <Action>
    <AddFiles target_db="SRA">
      <File file_path="fastq_1_R1.fastq.gz">
        <DataType>generic-data</DataType>
      </File>
      <File file_path="fastq_1_R2.fastq.gz">
        <DataType>generic-data</DataType>
      </File>
      <Attribute name="library_name">Other Test</Attribute>
      <Attribute name="instrument_model">Illumina NovaSeq 6000</Attribute>
      <Attribute name="library_strategy">AMPLICON</Attribute>
      <Attribute name="library_source">VIRAL RNA</Attribute>
      <Attribute name="library_selection">RT-PCR</Attribute>
      <Attribute name="library_layout">PAIRED</Attribute>
      <Attribute name="library_construction_protocol">Helix Hybrid-Capture Test</Attribute>
      <Attribute name="loader">latf-load</Attribute>
      <AttributeRefId name="BioProject">
        <RefId>
          <PrimaryId>PRJNA512913</PrimaryId>
        </RefId>
      </AttributeRefId>
      <AttributeRefId name="BioSample">
        <RefId>
          <SPUID spuid_namespace="CDC-OAMD_bs">seq1</SPUID>
        </RefId>
      </AttributeRefId>
      <Identifier>
        <SPUID spuid_namespace="CDC-OAMD_sra">seq1</SPUID>
      </Identifier>
    </AddFiles>
  </Action>
  <Action>
    <AddFiles target_db="SRA">
      <File file_path="fastq_2_R1.fastq.gz">
        <DataType>generic-data</DataType>
      </File>
      <File file_path="fastq_2_R2.fastq.gz">
        <DataType>generic-data</DataType>
      </File>
      <Attribute name="library_name">Other Test</Attribute>
      <Attribute name="instrument_model">Illumina NovaSeq 6000</Attribute>
      <Attribute name="library_strategy">AMPLICON</Attribute>
      <Attribute name="library_source">VIRAL RNA</Attribute>
      <Attribute name="library_selection">RT-PCR</Attribute>
      <Attribute name="library_layout">PAIRED</Attribute>
      <Attribute name="library_construction_protocol">Helix Hybrid-Capture Test</Attribute>
      <Attribute name="loader">latf-load</Attribute>
      <AttributeRefId name="BioProject">
        <RefId>
          <PrimaryId>PRJNA512962</PrimaryId>
        </RefId>
      </AttributeRefId>
      <AttributeRefId name="BioSample">
        <RefId>
          <SPUID spuid_namespace="CDC-OAMD_bs">seq2</SPUID>
        </RefId>
      </AttributeRefId>
      <Identifier>
        <SPUID spuid_namespace="CDC-OAMD_sra">seq2</SPUID>
      </Identifier>
    </AddFiles>
  </Action>
</Submission>
35 changes: 35 additions & 0 deletions POX_species/config.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,35 @@
# Test submission configuration (placeholder credentials only).
# Nesting restored: without indentation the keys Username, Password,
# Submission_Position and Name collide at a single mapping level.
# NOTE(review): hierarchy is inferred from how Organization/Contact and
# affil/email are grouped in NCBI submission XML and .sbt templates;
# confirm against the tool's config template.
Submission:
  NCBI:
    # Placeholders; never commit real credentials.
    Username: username
    Password: password
    Table2asn: True
    Submission_Position: 1
    Description:
      Title: test_submission
      Comment: This is a test submission
      Organization:
        '@role': owner
        '@type': institute
        '@org_id': 12345
        Name: CDC
        Address:
          Affil: Centers for Disease Control and Prevention
          Div: Respiratory Viruses Branch, Division of Viral Diseases
          Street: 1600 Clifton Rd
          City: Atlanta
          Sub: GA
          Postal_code: 30329
          Country: USA
          # NOTE(review): address looks redacted in this copy; an unquoted value
          # starting with "[" parses as a YAML flow sequence. Supply a real,
          # quoted e-mail address.
          Email: [email protected]
          Phone: ""
        Submitter:
          # NOTE(review): same redaction caveat as Address.Email.
          '@email': [email protected]
          '@alt_email':
          Name:
            First: Jane
            Last: Doe
  GISAID:
    Client-Id: TEST-EA76875B00C3
    # Placeholders; never commit real credentials.
    Username: username
    Password: password
    Submission_Position: 2
3 changes: 3 additions & 0 deletions POX_species/metadata.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
ncbi-spuid,ncbi-spuid_namespace,bs-description,organism,ncbi-bioproject,bs-isolate,bs-collected_by,bs-package,collection_date,bs-host,bs-host_disease,bs-isolation_source,bs-geo_loc_name,bs-lat_lon,bs-host_sex,bs-host_age,sra-file_location,sra-file_name,sra-library_name,sra-instrument_model,sra-library_strategy,sra-library_source,sra-library_selection,sra-library_layout,sra-library_construction_protocol,sra-loader,sequence_name,gb-subm_lab,gb-subm_lab_division,gb-subm_lab_addr,authors,gb-publication_status,gb-publication_title,gb-seq_id,src-isolate,src-country,src-host,src-isolation_source,src-serotype,src-BioProject,src-BioSample,cmt-StructuredCommentPrefix,cmt-Assembly Method,cmt-Coverage,cmt-Sequencing Technology,cmt-StructuredCommentSuffix,gs-seq_id,gs-virus_name,gs-passage,gs-collection_date,gs-location,gs-add_location,gs-host,gs-add_host_info,gs-sampling_strategy,gs-gender,gs-patient_age,gs-patient_status,gs-specimen,gs-outbreak,gs-last_vaccinated,gs-treatment,gs-seq_technology,gs-assembly_method,gs-coverage,gs-orig_lab,gs-orig_lab_addr,gs-provider_sample_id,gs-subm_lab,gs-subm_lab_addr,gs-subm_sample_id,gs-consortium,gs-comment,gs-comment_type
seq1,CDC-OAMD,CDC Test,Monkeypox virus,PRJNA512913,MPXV/human/USA/GA_2741/2020,Helix,Pathogen.cl.1.0,3/28/2020,Homo sapiens,Monkeypox virus,nasal swab,United States: Georgia,Unknown,Male,28,local,"fastq_1_R1.fastq.gz, fastq_1_R2.fastq.gz",Other Test,Illumina NovaSeq 6000,AMPLICON,VIRAL RNA,RT-PCR,PAIRED,Helix Hybrid-Capture Test,latf-load,seq1,NIH,NCBI,"10 Center Dr, Bethesda, MD, USA 20895","Doe, John, R.; Doe, Jane;",unpublished,,MPXV/human/USA/GA_2741/2020,MPXV/human/USA/GA_2741/2020,USA: GA,Homo sapiens,missing,Clade 1,PRJNA512913,SAMN02224951,Assembly-Data,Newbler v. 2.3,100x,Illumina ,Assembly-Data,MPXV/Anzark/12/2022,MPXV/Anzark/12/2022,Original,3/28/2022,Oceania/Australia/Melbourne,unknown,Human,,,unknown,unknown,unknown,,,,,Illumina NextSeq 550,,3000x,Bio1 Mel,"16 Info St, Mel, Aus",,Bio2 Mel,"32 Data St, Mel, Aus",,,,
seq2,CDC-OAMD,CDC Test,Monkeypox virus,PRJNA512962,MPXV/human/USA/GA_3742/2020,Helix,Pathogen.cl.1.0,4/29/2020,Homo sapiens,Monkeypox virus,nasal swab,United States: Georgia,Unknown,Male,45,local,"fastq_2_R1.fastq.gz, fastq_2_R2.fastq.gz",Other Test,Illumina NovaSeq 6000,AMPLICON,VIRAL RNA,RT-PCR,PAIRED,Helix Hybrid-Capture Test,latf-load,seq2,NIH,NCBI,"10 Center Dr, Bethesda, MD, USA 20895","Doe, John; Doe, Jane;",unpublished,,MPXV/human/USA/GA_3742/2020,MPXV/human/USA/GA_3742/2020,USA: GA,Homo sapiens,missing,Clade 1,PRJNA512962,SAMN02224986,Assembly-Data,Newbler v. 2.3,100x,Illumina,Assembly-Data ,MPXV/Anzark/13/2022,MPXV/Anzark/13/2022,Original,3/28/2022,Oceania/Australia/Melbourne,unknown,Human,,,unknown,unknown,unknown,,,,,Illumina NextSeq 550,,3000x,Bio1 Mel,"16 Info St, Mel, Aus",,Bio2 Mel,"33 Data St, Mel, Aus",,,,
Binary file added POX_species/raw_reads/fastq_1_R1.fastq.gz
Binary file not shown.
Binary file added POX_species/raw_reads/fastq_1_R2.fastq.gz
Binary file not shown.
Binary file added POX_species/raw_reads/fastq_2_R1.fastq.gz
Binary file not shown.
Binary file added POX_species/raw_reads/fastq_2_R2.fastq.gz
Binary file not shown.
Loading

0 comments on commit 573e1a6

Please sign in to comment.