#! /usr/local/bin/gawk -f
# rgs, imim.sb, aug 98
#
# Turns exon lines from a gene-prediction report (presumably GENSCAN output,
# going by the default source name -- confirm against the producer) into
# tab-separated GFF-style records:
#
#   seqname  source  feature  start  end  score  strand  frame  group
#
# Only lines whose second column is one of the exon types listed in
# gff_feature are converted; every other line is ignored, except that a
# line starting with "Sequence" sets the sequence name used for the
# records that follow.

BEGIN {
    # Value written to the GFF "source" column. Because it is assigned in
    # BEGIN, it can be replaced by a source=NAME operand placed before the
    # input file on the command line (a -v assignment would be overwritten
    # here).
    source = "genscan";

    # Column numbers of the values read from each exon line.
    exonid  = 1;
    feature = 2;
    strand  = 3;
    start   = 4;
    end     = 5;
    frame   = 7;
    score   = 13;

    # Exon type code found in the input -> feature name written to the output.
    gff_feature["Init"] = "First";
    gff_feature["Intr"] = "Internal";
    gff_feature["Term"] = "Terminal";
    gff_feature["Sngl"] = "Single";

    # One output record: nine tab-separated columns.
    gff_format = "%s\t%s\t%s\t%d\t%d\t%.2f\t%s\t%s\t%s\n";
}

# Remember the sequence name for the exon records that follow.
$1 == "Sequence" {
    seqname = $2;
}

# Exon line: its type column holds one of the known exon codes.
($feature in gff_feature) {
    # The exon id looks like "<gene>.<exon>"; the part before the first dot
    # becomes the group. With no dot the prefix is empty and the group is 0.
    dot  = index($exonid, ".");
    gene = substr($exonid, 1, dot - 1) + 0;

    # Always print the lower coordinate first, whichever column holds it.
    if ($start > $end) {
        lo = $end;
        hi = $start;
    } else {
        lo = $start;
        hi = $end;
    }

    printf gff_format, seqname, source, gff_feature[$feature], lo, hi, $score, $strand, $frame, gene;
}