##################################
#                                #
# Last modified 2018/09/25       # 
#                                #
# Georgi Marinov                 #
#                                # 
##################################

import sys

def run():
    """Collapse a tab-delimited table into FASTA records, one per unique sequence.

    Command-line arguments are read from ``sys.argv``:

    * ``sys.argv[1]`` -- input file name, or ``-`` to read from stdin.
    * ``sys.argv[2]`` -- index (as used for Python list indexing, so the
      first column is 0) of the field holding the sequence.
    * ``sys.argv[3]`` -- index of the field holding the label.

    Lines starting with ``#`` and blank lines are skipped.  Every remaining
    line is stripped of surrounding whitespace and split on tabs.  For each
    distinct sequence a two-line record is printed to stdout: a header line
    consisting of ``>`` followed by all labels seen with that sequence
    (comma-separated, in the order they were read), then the sequence itself.
    Records are emitted in the iteration order of the underlying dict.

    Exits with status 1 after printing a usage message when fewer than the
    three required arguments are supplied.

    Raises:
        ValueError: if either field index is not an integer.
        IndexError: if a data line has fewer fields than a requested index.
    """
    # sys.argv[0] is the script name, so three required arguments means the
    # list must hold at least four entries (sys.argv[3] is read below).
    if len(sys.argv) < 4:
        # NOTE(review): the usage text advertises -minSeqLen, but no such
        # option is handled anywhere in this function.
        print('usage: python %s inputfilename sequenceFieldID labelFieldID [-minSeqLen number]' % sys.argv[0])
        print('\tthe script accepts stdin as input')
        print('\tthe script will print to stdout')
        sys.exit(1)

    inputfilename = sys.argv[1]
    seqFieldID = int(sys.argv[2])
    labelFieldID = int(sys.argv[3])

    # Maps each sequence to the list of labels it was seen with.
    SeqDict = {}

    read_stdin = inputfilename == '-'
    lineslist = sys.stdin if read_stdin else open(inputfilename)
    try:
        for line in lineslist:
            if line.startswith('#'):
                continue
            stripped = line.strip()
            if not stripped:
                # A blank line carries no fields; indexing it would fail.
                continue
            fields = stripped.split('\t')
            SeqDict.setdefault(fields[seqFieldID], []).append(fields[labelFieldID])
    finally:
        # Only close what this function opened; stdin belongs to the caller.
        if not read_stdin:
            lineslist.close()

    for seq in SeqDict:
        print('>' + ','.join(SeqDict[seq]))
        print(seq)

# Run only when executed as a script, so importing this module has no side effects.
if __name__ == '__main__':
    run()

