Skip to content

Commit

Permalink
pub data
Browse files Browse the repository at this point in the history
  • Loading branch information
kenminsoo committed Aug 4, 2023
1 parent 8914aa6 commit a5d63d1
Show file tree
Hide file tree
Showing 14 changed files with 19,595 additions and 22 deletions.
Binary file modified .DS_Store
Binary file not shown.
1 change: 0 additions & 1 deletion .gitignore
Original file line number Diff line number Diff line change
@@ -1,7 +1,6 @@
testing_env/
RNA_central/
SPRMT_merge_031323_seq.gtf
*.fa
*.fai
*.tsv
.Rproj.user
Expand Down
Binary file modified __pycache__/gtf_groundtruth.cpython-310.pyc
Binary file not shown.
20 changes: 10 additions & 10 deletions sRNA_frag_config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,12 +16,12 @@ module_options:
# for our cell line samples, UMIs and Adapters are already removed.
# We add adapter trimming time from 9 core run.
umi_removal:
bool: False
bool: True
regex: ".+(?P<discard_1>AACTGTAGGCACCATCAAT){s<=2}(?P<umi_1>.{12}).+"

# Remove Adapters, Default is Illumina universal
adapter_removal:
bool: False
bool: True
sequence: AGATCGGAAGAG

# An annotation file to generate fragments from => Should be filtered with sequences
Expand Down Expand Up @@ -55,13 +55,13 @@ module_options:

# from ITAS publication
# merged with snoDB
annotation_file: ""
annotation_file: "/Users/kenminsoo/Desktop/unprocessed-annotations/testing_env/SPRMT_merge_031323_seq.gtf"

# Find out of space maps
find_out_bool: False
find_out_bool: True

# Indexed reference genome for out of space maps
built_index_location: ""
built_index_location: "/Users/kenminsoo/Desktop/unprocessed-annotations/hg38"

# Plot counts vs. fragment location on every souce transcript
plot_every_source: True
Expand All @@ -77,19 +77,19 @@ module_options:
SUMMARY: True

# Delete the working directory
delete_working: True
delete_working: False

system_options:
# Max number of cores to use
num_cores: 9
num_cores: 5
# Keep this amount of memory free in G
mem_free: 2

# Use full paths, Do not end path with / (i.e. /bin/bash not /bin/bash/)
dir_locations:
# Set the working dir
working_dir: "/Users/kenminsoo/Desktop/Projects/JABSOM/Nakatsu/projects/tools/install/test_results/working"
working_dir: "/Volumes/Extreme_SSD/Lung_smRNAseq-2021_BW/working"
# Location of samples (ENSURE *.fastq.gz)
sample_dir: "/Users/kenminsoo/Desktop/Projects/JABSOM/Nakatsu/projects/tools/install/test_data"
sample_dir: "/Volumes/Extreme_SSD/Lung_smRNAseq-2021_BW"
# Dir to output files
out_dir: "/Users/kenminsoo/Desktop/Projects/JABSOM/Nakatsu/projects/tools/install/test_results/out"
out_dir: "/Volumes/Extreme_SSD/Lung_smRNAseq-2021_BW/out_sno"
19 changes: 11 additions & 8 deletions sRNA_fragment.py
Original file line number Diff line number Diff line change
Expand Up @@ -38,7 +38,17 @@

## -- Config Variables -- ##

if P2_bool == True:
os.system("cp sRNA_frag_config.yaml " + out_dir + ";\
cp sRNA_fragment_P2.py " + out_dir + ";\
cp gtf_groundtruth.py " + out_dir + ";\
cp gtf_modifiers.py " + out_dir + ";\
cp conversion_tools.py " + out_dir + ";\
cp alias_work.py " + out_dir + ";\
cp basics.py " + out_dir)

if P1_bool == True:
print("User can start running next instance of sRNAfrag.")
os.system("python sRNA_fragment_P1.py")

if S1_bool == True:
Expand All @@ -51,14 +61,7 @@
os.system("mkdir " + working_dir + "/aligned_sams")
os.system("cp scripts/.add_prefix_outspace.sh " + working_dir + "/aligned_sams")

os.system("cp sRNA_frag_config.yaml " + out_dir + ";\
cp sRNA_fragment_P2.py " + out_dir + ";\
cp gtf_groundtruth.py " + out_dir + ";\
cp gtf_modifiers.py " + out_dir + ";\
cp conversion_tools.py " + out_dir + ";\
cp alias_work.py " + out_dir + ";\
cp basics.py " + out_dir + ";\
cd " + out_dir + ";\
os.system("cd " + out_dir + ";\
python sRNA_fragment_P2.py")

# Clean up Module
Expand Down
6 changes: 6 additions & 0 deletions sRNA_fragment_P1.py
Original file line number Diff line number Diff line change
Expand Up @@ -227,6 +227,12 @@
print("Use ctrl-C to cancel pipeline.")
input()

# Remove the subset files
if remove_adapters_bool == True:
if fastqc_bool == True:
os.system("cd " + out_dir + ";\
rm -rf subset_*")

gtf_attribute_to_fasta(annotation_file, working_dir + "/transcriptome.fa", "sequence", "transcript_id", pipeline = True)

generate_index_bowtie(working_dir + "/transcriptome.fa", working_dir + "/transcriptome")
Expand Down
Binary file modified scripts/.DS_Store
Binary file not shown.
3,834 changes: 3,834 additions & 0 deletions scripts/pub_figs/anchored_mirna.fa

Large diffs are not rendered by default.

Loading

0 comments on commit a5d63d1

Please sign in to comment.