Skip to content

Commit 0d1b76b

Browse files
Removed files that are no longer available; changed output file names
1 parent 62a1b47 commit 0d1b76b

File tree

1 file changed

+8
-7
lines changed

1 file changed

+8
-7
lines changed

ncbigene/ncbigene.php

Lines changed: 8 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -39,10 +39,10 @@ class NCBIGeneParser extends Bio2RDFizer
3939
"gene2ensembl" => "gene2ensembl.gz",
4040
"gene2go" => "gene2go.gz",
4141
"gene2pubmed" => "gene2pubmed.gz",
42-
"gene2refseq" => "gene2refseq.gz",
43-
"gene2sts" => "gene2sts",
44-
"gene2unigene" => "gene2unigene",
45-
"gene2vega" => "gene2vega.gz",
42+
"gene2refseq" => "gene2refseq.gz"
43+
#"gene2sts" => "gene2sts",
44+
#"gene2unigene" => "gene2unigene",
45+
#"gene2vega" => "gene2vega.gz",
4646
);
4747
private $taxids = null;
4848
private $default_taxids = array(
@@ -64,7 +64,7 @@ function __construct($argv) {
6464
parent::__construct($argv,"ncbigene");
6565

6666
// set and print application parameters
67-
parent::addParameter('files',true,'all|geneinfo|gene2accession|gene2ensembl|gene2go|gene2pubmed|gene2refseq|gene2sts|gene2unigene|gene2vega','','files to process');
67+
parent::addParameter('files',true,'all|geneinfo|gene2accession|gene2ensembl|gene2go|gene2pubmed|gene2refseq','','files to process'); # |gene2sts|gene2unigene|gene2vega were removed
6868
parent::addParameter('download_url',false,null,'ftp://ftp.ncbi.nih.gov/gene/DATA/');
6969
parent::addParameter('limit_organisms',false,'true|false','true','flag to use specified organisms');
7070
parent::addParameter('organisms',false,null,implode(",",array_keys($this->default_taxids)),'taxonomy ids for organisms to process');
@@ -129,7 +129,7 @@ function process()
129129
$file = $module.".gz";
130130
$lfile = $ldir.$file;
131131
$rfile = $rdir.$rfilename;
132-
$ofile = $module.".".parent::getParameterValue('output_format');
132+
$ofile = "bio2rdf-".$module.".".parent::getParameterValue('output_format');
133133

134134
$gz = false;
135135
if(strstr(parent::getParameterValue('output_format'), "gz")) $gz = true;
@@ -140,6 +140,7 @@ function process()
140140
$fnx = $module;
141141
if($module == 'gene2refseq') $fnx = 'gene2accession';
142142
$this->$fnx();
143+
143144
parent::clear();
144145

145146
echo 'done!'.PHP_EOL;
@@ -343,7 +344,7 @@ private function gene2accession()
343344
$z = 1;
344345
while($l = $this->getReadFile()->read(200000)){
345346
if($l[0] == "#") continue;
346-
if(($z++) % 10000 == 0) {echo $z.PHP_EOL;parent::clear();}
347+
if(($z++) % 100000 == 0) {echo $z.PHP_EOL;parent::clear();}
347348
$a = explode("\t",rtrim($l));
348349
if(count($a) != 16) { trigger_error("gene2accession: expecting 16 columns, found ".count($a)." instead", E_USER_ERROR);}
349350
$taxid = $a[0];

0 commit comments

Comments
 (0)