Skip to content

Commit

Permalink
fix(design): allow additional file extensions in GEOFiles and improve processed data files handling
Browse files (browse the repository at this point in the history)
  • Loading branch information
alsmith151 committed Nov 15, 2024
1 parent 9a35988 commit 2fb24f0
Show file tree
Hide file tree
Showing 2 changed files with 9 additions and 3 deletions.
4 changes: 3 additions & 1 deletion seqnado/design.py
Original file line number Diff line number Diff line change
Expand Up @@ -929,6 +929,7 @@ class GEOFiles(BaseModel):
sample_names: List[str]
config: dict
design: pd.DataFrame
extensions_allowed: List[str] = [".txt", ".bigWig", ".bed", ".tsv", ".vcf.gz"]

processed_files: Optional[List[Union[str, pathlib.Path]]] = None

Expand All @@ -947,7 +948,8 @@ def md5sums(self):

@property
def processed_data_files(self) -> pd.DataFrame:
wanted_exts = [".txt", ".bigWig", ".bed", '.tsv']

wanted_exts = self.extensions_allowed
unwanted_files = [*self.md5sums]

# Create a DataFrame with the processed files
Expand Down
8 changes: 6 additions & 2 deletions seqnado/workflow/rules/geo_submission.smk
Original file line number Diff line number Diff line change
Expand Up @@ -37,8 +37,12 @@ def get_symlinked_files(wc: Any = None) -> List[str]:
processed_files=[str(p) for p in OUTPUT.files],
)

processed_files = geo_files.processed_data_files['output_file_name'].tolist()
processed_files = [outdir / fn for fn in processed_files]


if processed_files := geo_files.processed_data_files['output_file_name'].tolist():
processed_files = [outdir / fn for fn in processed_files]
else:
processed_files = []


return [*fastqs, *processed_files]
Expand Down

0 comments on commit 2fb24f0

Please sign in to comment.