-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathparseOutGenesMI.pl
More file actions
38 lines (35 loc) · 1.1 KB
/
parseOutGenesMI.pl
File metadata and controls
38 lines (35 loc) · 1.1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
#parseOutGenesZI.pl
#this script runs through all of the paralogs identified and all of the genes in an organism
#and creates a list of all those genes that are not involved, so far, in a paralog relationship
#with small changes this file will be run on in and out paralogs for mice and zebrafish
#file to store paralogs that need to be checked
open(OUT,">unCheckedMouseInParalogs.txt") ||die("unCheckedMouseInParalogs.txt does not open");
open(OUT2,">checkedMouseInParalogs.txt") ||die("checkedMouseInParalogs.txt does not open");
#read in full list of genes
open(IN1,"mouseGenes.txt")||die("mouseGenes.txt does not open");
#read in paralogs
open(IN2,"mouseInParalogs.txt")||die("mouseInParalogs.txt does not open");
@genes = <IN1>;
@paralogs = <IN2>;
$count = 0;
#run through all genes
foreach $gene (@genes){
@columns = split(" ",$gene);
$ID = $columns[1];
$found = 0;
#run through paralog list
foreach $log (@paralogs){
if($log =~ m/$ID/){
$found = 1;
last;
}
}
if(!$found){
print OUT "$ID\n";
$count ++;
}
else{
print OUT2 "$ID\n";
}
}
print "$count genes yet to be found \n";