# Merge the cluster-level and group-level annotations carried on one
# tab-separated record into a single 6-column, BED-like output line.
#
# Input: 12 tab-separated fields, i.e. two 6-column records side by side.
# Column names below are taken from the original header notes of this script.
#
#   cluster record (fields 1-6)
#     $1   Chromosome
#     $2   ClusterStart
#     $3   ClusterEnd
#     $4   ClusterID_ClusterSequence_ReadCount_ModeLocation_
#          ConversionLocationCount_ConversionEventCountC_NonConversionEventCount
#     $5   ModeScore
#     $6   Strand
#
#   group/dist record (fields 7-12)
#     $7   Chromosome
#     $8   ClusterStart
#     $9   ClusterEnd
#     $10  ClusterID_AvgConversionPct_ConversionEventCountG_SdevConversionPct
#     $11  MaxConversionPct
#     $12  Strand
#
# Output: 6 tab-separated fields.
#     1  Chromosome        ($1)
#     2  ClusterStart      ($2)
#     3  ClusterEnd        ($3)
#     4  $4, then ModeScore ($5), then parts 2-4 of $10
#        (AvgConversionPct, ConversionEventCountG, SdevConversionPct),
#        all joined with "_"
#     5  MaxConversionPct  ($11)
#     6  Strand            ($6)
#
# Example (fields are tab-separated in the real data):
#   in:
#     $1-$6 :  ENSMUST00000000254-chr6-+-128884399-128885000  278  324
#              G5.2_ATTAGTTATTCTATTGGAGTATACAATACTCGAATAGTTCTCAGGCA_275_317_5_96_1643
#              0.7790820460717197  +
#     $7-$12:  ENSMUST00000000254-chr6-+-128884399-128885000  163  374
#              G5_0.004717_212_0.019691  0.126365  +
#   out:
#     ENSMUST00000000254-chr6-+-128884399-128885000  278  324
#     G5.2_ATTAGTTATTCTATTGGAGTATACAATACTCGAATAGTTCTCAGGCA_275_317_5_96_1643_0.7790820460717197_0.004717_212_0.019691
#     0.126365  +
#
# NOTE(review): every input line is processed; an earlier guard that skipped
# lines whose first field starts with "Chro" is disabled, so the input is
# presumably expected to carry no header row -- confirm with the caller.

BEGIN {
    FS  = "\t"    # records are tab-delimited
    OFS = "\t"    # emit tab-delimited output from a comma-separated print
}

{
    # Break the group annotation apart. ginfo[1] is the group's own
    # ClusterID, which is not carried into the output; only parts 2-4 are.
    # split() clears ginfo first, so short values leave the missing parts
    # empty rather than reusing data from the previous record.
    split($10, ginfo, "_")

    # Extend the cluster ID string with the mode score and the group stats.
    merged_id = $4 "_" $5 "_" ginfo[2] "_" ginfo[3] "_" ginfo[4]

    print $1, $2, $3, merged_id, $11, $6
}