Skip to content
Snippets Groups Projects
Commit 8c9c4078 authored by Emmanuel Mongin's avatar Emmanuel Mongin
Browse files

dros options

parent 39664ac0
No related branches found
No related tags found
No related merge requests found
......@@ -19,7 +19,7 @@ my $organism = $conf{'organism'};
my $sptr_swiss = $conf{'sptr_swiss'};
my $out = $conf{'x_map_out'};
#Get specific options for human/mouse/rat
#Get specific options for human/mouse/rat/drosophila
my $refseq_gnp = $conf{'refseq_gnp'};
#Get specific options for human
......@@ -42,6 +42,8 @@ my $eleg_nom = $conf{'eleg_nom'};
my $zeb_gene = $conf{'zeb_gene'};
my $zeb_dblink = $conf{'zeb_dblink'};
#Get specific options for drosophila
my $ext_annot = $conf{'dros_ext_annot'};
my $briggsae_peptides = $conf{'briggsae_hybrid'};
......@@ -63,7 +65,7 @@ my ($swiss, $ac, $id) = &parse_sp_file($sptr_swiss);
&process_parsed_sp($swiss, $ac, $id, \*OUT);
if (($organism eq "human") || ($organism eq "mouse") || ($organism eq "rat") || ($organism eq "zebrafish")) {
if (($organism eq "human") || ($organism eq "mouse") || ($organism eq "rat") || ($organism eq "zebrafish") || ($organism eq "drosophila")) {
#Read the refseq file in gnp format
print STDERR "Reading REFSEQ File\n";
......
......@@ -28,10 +28,10 @@ package main;
#The mapping to known genes is assymetrical. This is due to the fact that's our gene prediction is quite fragmented compared to the manually curated genes
#'query_idt' => 40,
'query_idt' => ,
'query_idt' => 50,
#'target_idt => 10,
'target_idt' => ,
'target_idt' => 50,
......@@ -47,7 +47,7 @@ package main;
#Location of the query peptide file (eg: Ensembl predicted protein)
#'query' => '/work1/mongin/mapping/primary/ensembl110.pep',
'query' => '',
'query' => '/acari/work4/mongin/dros3_mapping/Primary/drosophila-release3-peptides.fasta',
#Location of the sptr file, this file will be used as an
#input to grep the specific sp entries to the organism
......@@ -58,32 +58,32 @@ package main;
#Location of the sptr file in fasta format containing the entries specific to the organism
#'sptr_fa' => '/work1/mongin/mapping/primary/HS.f',
'sptr_fa' => '',
'sptr_fa' => '/acari/work4/mongin/dros3_mapping/Primary/7227.FASTAC',
#Location of the sptr file in Swiss-Prot format containing the entries specific to the organism
#'sptr_swiss' => '/ecs2/work1/lec/briggsae_peptides/briggsae.test',
'sptr_swiss' => '',
'sptr_swiss' => '/acari/work4/mongin/dros3_mapping/Primary/7227.SPC',
#Location of the file containing all refseq and all SP in fasta format (This file will be produced by running prepare_proteome.pl)
'pmatch_input_fa' => '',
'pmatch_input_fa' => '/acari/work4/mongin/dros3_mapping/Primary/total.fa',
#Output file containing the mapping of SP and refseq sequences to external databases
'x_map_out' => '',
'x_map_out' => '/acari/work4/mongin/dros3_mapping/Output/xmap.out',
#Output file from pmatch.pl and input file for maps2db.pl
#'pmatch_out' => '/work1/mongin/mapping/outputs/pmatch_human1.txt',
'pmatch_out' => '',
'pmatch_out' => '/acari/work4/mongin/dros3_mapping/Output/pmatch.out',
#Location of the Refseq (proteins) file in fasta format
#'refseq_fa' => '/work1/mongin/mapping/primary/refseq.fa',
'refseq_fa' => '',
'refseq_fa' => '/acari/work4/mongin/dros3_mapping/Primary/fly.faa',
#Location of the Refseq (proteins) file in Genbank format
#'refseq_gnp' => '/work1/mongin/mouse/mapping/primary/mouse.gnp',
'refseq_gnp' => '',
'refseq_gnp' => '/acari/work4/mongin/dros3_mapping/Primary/fly.gnp',
############################################
#Organism specific files for the X_mapping #
......@@ -147,7 +147,7 @@ package main;
#drosophila#
############
'dros_ext_annot' => '',
'dros_ext_annot' => '/acari/work4/mongin/dros3_mapping/Primary/xrefs.txt',
##########
......@@ -184,7 +184,7 @@ package main;
#Location for pmatch binaries
#'pmatch' => '/nfs/disk65/ms2/bin/pmatch'
'pmatch' => '/nfs/disk65/ms2/bin/pmatch',
'pmatch' => '/nfs/disk5/ms2/bin/pmatch',
......@@ -195,7 +195,7 @@ package main;
#Name of the organism studied. Current keywords used(or planned to be used): human, drosophila, mouse, elegans, anopheles, zebrafish
#You can adapt the other scripts given the organisms (eg: do some specific x_mapping for a given organism)
#'organism' => 'human'
'organism' => '',
'organism' => 'drosophila',
#OX (Organism taxonomy cross-reference) number
......
......@@ -59,7 +59,9 @@ my $organism = $conf{'organism'};
my $refseq_pred = $conf{'refseq_pred_fa'};
my $sub_genes = $conf{'submitted_genes'};
if (($organism eq "human") || ($organism eq "mouse") || ($organism eq "rat")) {
print STDERR "Prepare proteome using following files: SPTR ($sptr)\nREFSEQ ($refseq)\nPROTFILE ($protfile)\n";
if (($organism eq "human") || ($organism eq "mouse") || ($organism eq "rat") || ($organism eq "drosophila")) {
&parse_refseq;
}
......
......@@ -37,7 +37,7 @@ my %query2length;
#################################
# run scanwisepep
my $scanwise = "/nfs/acari/birney/prog/wise2/src/models/scanwisep -seqdb $target $query -seqloadtile 5 -hspthread -hspthreadno 4 -hsp2hit_best -hsp2hit_best_perc 10 -hitoutput tab >> /tmp/$$.pmatch";
my $scanwise = "/usr/local/ensembl/bin/scanwisep-2.2.3-rc6 -seqdb $target $query -seqloadtile 5 -hspthread -hspthreadno 4 -hsp2hit_best -hsp2hit_best_perc 10 -hitoutput tab >> /tmp/$$.pmatch";
print STDERR "Running Scanwise: $scanwise\n";
......
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment