# count by gene ids
#
# For the pubids rows selected by the two grep filters, report how many
# distinct gene ids (column 1) were seen with each assembler label (column 3)
# and with each k-mer label (column 4).  Before counting, assembler labels
# idbf/idbr are folded into "idba", and the last digit of a two-digit k-mer
# label is replaced by 5 (k21, k29 -> k25), so k-mers are binned by tens.
#
# Each output row is:  count,percent%  unique-count,percent%u  label
#   count   = distinct gene ids seen with this label
#   unique  = gene ids seen with this label and with no other label of the
#             same kind (assembler or kmer)
#   percent = relative to the total number of distinct gene ids read
#
# The report text is the same as the earlier one-liner printed; "egrep" is
# replaced by "grep -E", and the duplicated assembler/kmer loops share one sub.
grep '^Anoalb4EVm00' evg4anoalb.perfdup.pubids | grep -E '(main|noclass)' | perl -ne '
    use strict;

    # Package variables rather than "my": -n wraps this code in a read loop,
    # and the END block below must see the tallies built up across all lines.
    our (%genes_by_asm, %genes_by_kmer, %asms_of_gene, %kmers_of_gene);

    s/\tidb[fr]/\tidba/;       # idbf, idbr -> idba
    s/\t(k\d)\d/\t${1}5/;      # kNN -> kN5

    # Only columns 1, 3 and 4 are used; column 2 is skipped.
    my ($gene, undef, $asm, $kmer) = split;
    $genes_by_asm{$asm}{$gene}++;
    $genes_by_kmer{$kmer}{$gene}++;
    $asms_of_gene{$gene}{$asm}++;
    $kmers_of_gene{$gene}{$kmer}++;

    # Print one table.
    #   $title     - heading word ("assembler" or "kmer")
    #   $genes_in  - hashref: label -> { gene id -> line count }
    #   $labels_of - hashref: gene id -> { label -> line count }
    #   $gene_ids  - arrayref of every distinct gene id read
    sub report {
        my ($title, $genes_in, $labels_of, $gene_ids) = @_;
        my $ngenes = @$gene_ids;
        print "$title (longest $ngenes genes):\n";
        for my $label (sort keys %$genes_in) {
            my $nfound = keys %{ $genes_in->{$label} };
            my $nuniq  = 0;
            for my $id (@$gene_ids) {
                my $hits = $labels_of->{$id};
                # unique = this gene has this label and no other one
                $nuniq++ if $hits->{$label} and keys(%$hits) == 1;
            }
            printf "%5d,%4.1f%% %4d,%4.1f%%u %s\n",
                $nfound, 100 * $nfound / $ngenes,
                $nuniq,  100 * $nuniq  / $ngenes,
                $label;
        }
    }

    END {
        # Every input line adds its gene id to %asms_of_gene, so its keys
        # are the full set of distinct gene ids.
        my @gene_ids = keys %asms_of_gene;
        report("assembler", \%genes_by_asm,  \%asms_of_gene,  \@gene_ids);
        report("kmer",      \%genes_by_kmer, \%kmers_of_gene, \@gene_ids);
    }
'

# Recorded output, kept as comments (column padding restored from the printf
# format above).
# NOTE(review): the 999 / all / BUSCOdmel / drosmel tables carry gene counts
# and labels that the command as written above would not print; presumably
# they came from hand-edited variants of the grep filter and the heading
# text, which are not recorded here -- confirm.

#-------------------------
# assembler (longest 9999 genes):
#  4622,46.2% 1464,14.6%u idba
#  2900,29.0%  352, 3.5%u soap
#  2408,24.1%  305, 3.1%u trin
#  7636,76.4% 4492,44.9%u velv
# kmer (longest 9999 genes):
#  2219,22.2%   80, 0.8%u k05
#  3903,39.0%  811, 8.1%u k25
#  5130,51.3% 1255,12.6%u k35
#  4897,49.0%  771, 7.7%u k45
#  4553,45.5%  492, 4.9%u k55
#  4764,47.6%  779, 7.8%u k65
#  4341,43.4%  544, 5.4%u k75
#  3920,39.2%  375, 3.8%u k85
#  3460,34.6%  168, 1.7%u k95
#
# assembler (longest 999 genes):
#   477,47.7%  168,16.8%u idba
#   290,29.0%   49, 4.9%u soap
#   136,13.6%   20, 2.0%u trin
#   741,74.2%  441,44.1%u velv
# kmer (longest 999 genes):
#   160,16.0%    2, 0.2%u k05
#   301,30.1%   55, 5.5%u k25
#   519,52.0%  149,14.9%u k35
#   511,51.2%   90, 9.0%u k45
#   496,49.6%   78, 7.8%u k55
#   458,45.8%   67, 6.7%u k65
#   393,39.3%   29, 2.9%u k75
#   359,35.9%   27, 2.7%u k85
#   314,31.4%   10, 1.0%u k95
#
# all genes
# assembler (all 29049 genes):
# 12516,43.1% 4677,16.1%u idba
#  6911,23.8% 1288, 4.4%u soap
#  8070,27.8% 2599, 8.9%u trin
# 18729,64.5% 11929,41.1%u velv
# kmer (all 29049 genes):
#  7210,24.8%  620, 2.1%u k05
# 12381,42.6% 4473,15.4%u k25
# 12855,44.3% 3572,12.3%u k35
# 11109,38.2% 1906, 6.6%u k45
# 10141,34.9% 1192, 4.1%u k55
# 10700,36.8% 1858, 6.4%u k65
#  9949,34.2% 1424, 4.9%u k75
#  9619,33.1% 1402, 4.8%u k85
#  8423,29.0%  586, 2.0%u k95

#-------------------------
# assembler (BUSCOdmel 2561 genes):
#  1082,42.2%  309,12.1%u idba
#   692,27.0%   75, 2.9%u soap
#   569,22.2%   50, 2.0%u trin
#  2089,81.6% 1285,50.2%u velv
# kmer (BUSCOdmel 2561 genes):
#   458,17.9%   28, 1.1%u k05
#   957,37.4%  174, 6.8%u k25
#  1177,46.0%  251, 9.8%u k35
#  1169,45.6%  200, 7.8%u k45
#  1085,42.4%  133, 5.2%u k55
#  1203,47.0%  266,10.4%u k65
#  1070,41.8%  192, 7.5%u k75
#   950,37.1%  136, 5.3%u k85
#   787,30.7%   70, 2.7%u k95
#
# assembler (drosmel 6725 genes):
#  2894,43.0%  868,12.9%u idba
#  1829,27.2%  207, 3.1%u soap
#  1568,23.3%  205, 3.0%u trin
#  5336,79.3% 3271,48.6%u velv
# kmer (drosmel 6725 genes):
#  1266,18.8%   64, 1.0%u k05
#  2515,37.4%  532, 7.9%u k25
#  3164,47.0%  772,11.5%u k35
#  3018,44.9%  516, 7.7%u k45
#  2808,41.8%  357, 5.3%u k55
#  3037,45.2%  644, 9.6%u k65
#  2717,40.4%  458, 6.8%u k75
#  2470,36.7%  362, 5.4%u k85
#  2095,31.2%  185, 2.8%u k95
#-----------------------------