-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathparseOutGenesMO.pl
More file actions
34 lines (31 loc) · 1000 Bytes
/
parseOutGenesMO.pl
File metadata and controls
34 lines (31 loc) · 1000 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
#parseOutGenesMO.pl
#This script runs through all of the identified paralogs and all of the genes in an organism
#and creates a list of the genes that are not, so far, involved in a paralog relationship.
#With small changes, this file can be run on in- and out-paralogs for mice and zebrafish.
# Lists every gene whose ID does not occur anywhere in the paralog file,
# i.e. the genes that still need to be checked for paralogs.
#
# Inputs (read from the current directory):
#   mouseGenes.txt       - one gene per line; the ID is taken from the
#                          second whitespace-separated column
#   mouseOutParalogs.txt - the paralog lines identified so far
# Outputs:
#   unCheckedMouseOutParalogs.txt - one unmatched gene ID per line
#   STDOUT                        - the number of IDs written
# Dies if any of the three files cannot be opened, or if the output file
# cannot be flushed/closed.
use strict;
use warnings;

#file to store paralogs that need to be checked
open(my $out_fh, '>', 'unCheckedMouseOutParalogs.txt')
    || die("unCheckedMouseOutParalogs.txt does not open: $!");
#read in full list of genes
open(my $genes_fh, '<', 'mouseGenes.txt')
    || die("mouseGenes.txt does not open: $!");
#read in paralogs
open(my $paralogs_fh, '<', 'mouseOutParalogs.txt')
    || die("mouseOutParalogs.txt does not open: $!");

# The paralog lines are scanned once per gene, so keep them in memory.
my @paralogs = <$paralogs_fh>;
close($paralogs_fh);

my $count = 0;

#run through all genes
GENE:
while (my $gene = <$genes_fh>) {
    my @columns = split(" ", $gene);
    my $ID      = $columns[1];

    # Blank or single-column lines carry no ID. Skip them: an empty search
    # pattern would otherwise match arbitrarily and could emit a blank line.
    next GENE if !defined $ID;

    #run through paralog list
    my $found = 0;
    foreach my $log (@paralogs) {
        # Literal comparison: the ID is data, not a regular expression, so
        # characters such as '.' or '+' must not act as metacharacters.
        # NOTE(review): this is still a substring test, as before, so an ID
        # that is a prefix of a longer ID counts as found - confirm whether
        # whole-token matching is wanted for this data.
        if (index($log, $ID) >= 0) {
            $found = 1;
            last;
        }
    }

    if (!$found) {
        print {$out_fh} "$ID\n";
        $count++;
    }
}
close($genes_fh);

# Buffered write errors only surface when the handle is closed.
close($out_fh) || die("unCheckedMouseOutParalogs.txt does not close: $!");

print "$count genes yet to be found \n";