Select Code to Download

Select or download this

# Build the lookup table from the tab-separated file open on $fh:
# the first column is the key, the remainder of the line is the value.
#
# Read line by line rather than through a single map/split so that
#   * lines without a tab separator (including blank lines) are skipped;
#     otherwise split returns a single element and every following
#     key/value pair in the list would be shifted by one, and
#   * trailing whitespace on the value (a stray tab after the last field,
#     or "\r" from a CRLF file) is removed, so it does not end up in the
#     replacement text.
# As before, a key that occurs more than once keeps its last value.
my %dict;
while (my $line = <$fh>) {
    chomp $line;

    # LIMIT of 2 keeps any further tabs inside the value and preserves an
    # empty value for a line of the form "KEY\t".
    my ($key, $value) = split /\t/, $line, 2;
    next unless defined $value;

    $value =~ s/\s+\z//;
    $dict{$key} = $value;
}

Select or download this

 > grpsTbl <- read.csv("Orthogroups_3.csv", header=T, sep = "\t", row.
+names = 1, stringsAsFactors=F)

Select or download this

"PBANKA_0000600, PBANKA_0000701, PBANKA_0000801, PBANKA_0001001, PBANK
+A_0001101, PBANKA_0001201, PBANKA_0001301, PBANKA_0001401, PBANKA_000
+1501, PBANKA_0006300, PBANKA_0006401, PBANKA_0006501, PBANKA_0006600,
+ PBANKA_0006701,"

Select or download this

"PmUG01_00010100.1-p1, PmUG01_00010200.1-p1, PmUG01_00010400.1-p1, PmU
+G01_00010500.1-p1, PmUG01_00010600.1-p1, PmUG01_00010700.1-p1, PmUG01
+_00010800.1-p1, PmUG01_00010900.1-p1, PmUG01_00011000.1-p1, PmUG01_00
+011300.1-p1, PmUG01_00011400.1-p1, PmUG01_00011600.1-p1, PmUG01_00011
+700.1-p1, PmUG01_00012100.1-p1, PmUG01_00012200.1-p1,"

Select or download this

PVX_088085    Protein processing in endoplasmic reticulum    
PVX_114095    Protein processing in endoplasmic reticulum    
...
PYYM_1032000    -    
PYYM_1120600    -
PCYB_031930    Purine metabolism; Metabolic pathways; DNA replication;
+ Pyrimidine metabolism

Select or download this

# Sanity check on the lookup table: emit one warning per entry whose
# value contains a tab character, naming both the key and the value.
foreach my $key (keys %dict) {
    my $value = $dict{$key};

    # Nothing to report when the value holds no tab.
    next if index($value, "\t") < 0;

    warn "for lookup:$key tab in field:$value\n";
}

Select or download this

for lookup:PVX_114095 tab in field:Protein processing in endoplasmic r
+eticulum
for lookup:PYYM_1032000 tab in field:-
for lookup:PVX_088085 tab in field:Protein processing in endoplasmic r
+eticulum

Select or download this

 
# This script was excerpted from http://stackoverflow.com/questions/11678939/replace-text-based-on-a-dictionary
...
  s/($re)/$dict{$1}/g;
  print;
}