# Drop records whose sequence text duplicates that of an earlier record.
#
# Input is read in paragraph mode: records are separated by blank lines and
# every line of a record is one field.  Field 1 (the header line, e.g. a
# FASTA-style ">name ..." line) is ignored for comparison; fields 2..NF are
# upper-cased and concatenated to form the comparison key, so two records
# match even when the same sequence is wrapped at different line widths or
# written in a different letter case.  The first record seen for each key is
# printed unchanged; later records with the same key are suppressed.
#
# NOTE: statements must not be split across lines in the middle of an
# expression -- awk treats a newline as a statement terminator except after
# "{", ",", "&&", "||", "do", "else" and the ")" of if/for/while.
BEGIN {
    RS  = ""        # paragraph mode: blank line(s) delimit records
    ORS = "\n\n"    # follow every printed record with a blank line
    FS  = "\n"      # one field per input line
}

# Build the comparison key for the current record from its sequence lines.
{
    seq = ""
    for (i = 2; i <= NF; ++i)
        seq = seq toupper($i)
}

# Print the record only the first time its key is encountered.
!(seq in seen) {
    print
    seen[seq]       # a bare reference is enough to create the array element
}
QkVHSU57UlM9IiI7T1JTPSJcblxuIjsgRlM9IlxuIn0KICAgICAgIHtzZXE9IiI7Zm9yKGk9MjtpPD1ORjsrK2kpIHNlcT1zZXEgdG91cHBlcigkaSl9CiAgICAgICAhKHNlcSBpbiBhKXtwcmludDsgYVtzZXFdfQ==
Jmd0O3NlcXVlbmNlMV9DUCBbc2VxICB2aXJ1c10KTVFDS1NHVE5OVkZUQUlLWVRUTk5OSUlZS1NFTk5ETklJRlRLTklGTlZWVFRLREFGSUZTS05SR0lNTkwKRElUS0tGRFlIRUhSUEtMQ1ZGS0lJTlRRWVZOU1BFS01JREFXUFRNRElWQUxJVEUKCiZndDtzZXF1ZW5jZTIgW3ZpcnVzXQpNUUNLU0dUTk5WRlRBSUtZVFROTk5JSVlLU0VOTkROSUlGVEtOSUZOVlZUVEtEQUZJRlNLTlJHSU1OTApESVRLS0ZEWUhFSFJQS0xDVkZLSUlOVFFZVk5TUEVLTUlEQVdQVE1ESVZBTElURQoKJmd0O3NlcXVlbmNlMwpNUUNLU0dUTk5WRlRBSUtZVFROTk5JSVlLU0VOTkROSUlGVEtOSUZOVlZUVEtEQUZJRlNLTlJHSU1OTApESVRLS0ZEWUhFSFJQS0xDVkZLSUlOVFFZVk5TUEVLTUlEQVdQVE1ESVZBTElURQoKJmd0O3NlcXVlbmNlNF9DUCBoeXBvdGhldGljYWwgcHJvdGVpbiBbYW5vdGhlciB2aXJ1c10KTUxSSFNDVk1QUVFLTEtLUkZGRkxSUkxSS0lMUllGRlRDTkZMTkxGRklOUkVZTklFTklUTFNZTEtLRVJJUFZXS1RTRE1TTgpJVlJLV1dNRkhSS1RRTEVETklFSUtLRElRTFlIRkZZTkdMRklLVE5ZUFlWWUhJREtLS0tZREZORE1LVklZTFBBSUhNSFNLCgomZ3Q7c2VxdWVuY2U1IGh5cG90aGV0aWNhbCBwcm90ZWluIFthbm90aGVyIHZpcnVzXQpNTFJIU0NWTVBRUUtMS0tSRkZGTFJSTFJLSUxSWUZGVENORkxOTEZGSU5SRVlOSUVOSVRMU1lMS0tFUklQVldLVFNETVNOCklWUktXV01GSFJLVFFMRUROSUVJS0tESVFMWUhGRllOR0xGSUtUTllQWVZZSElES0tLS1lERk5ETUtWSVlMUEFJSE1IU0sKCiZndDtzZXF1ZW5jZTYgfGh5cG90aGV0aWNhbCBwcm90ZWluW3ZpcnVzXQpNUUNLU0dUTk5WRlRBSUtZVFROTk5JSVlLU0VOTkROSUlGVEtOSUZOVlZUVEtEQUZJRlNLTlJHSU1OTEQKSVRLS0ZEWUhFSFJQS0xDVkZLSUlOVFFZVk5TUEVLTUlEQVdQVE1ESVZBTElURQoKJmd0O3NlcXVlbmNlNyB8aHlwb3RoZXRpY2FsIHByb3RlaW5bdmlydXNdCk1RQ0tTR1ROTlZGVEFJS1lUVE5OTklJWUtTRU5ORE5JSUZUS05JRk5WVlRUS0RBRklGU0tOUkdJTU5MRApJVEtLRkRZSEVIUlBLTENWRktJSU5UUVlWTlNQRUtNSURBV1BUTURJVkFMSVRF
>sequence1_CP [seq virus]
MQCKSGTNNVFTAIKYTTNNNIIYKSENNDNIIFTKNIFNVVTTKDAFIFSKNRGIMNL
DITKKFDYHEHRPKLCVFKIINTQYVNSPEKMIDAWPTMDIVALITE
>sequence2 [virus]
MQCKSGTNNVFTAIKYTTNNNIIYKSENNDNIIFTKNIFNVVTTKDAFIFSKNRGIMNL
DITKKFDYHEHRPKLCVFKIINTQYVNSPEKMIDAWPTMDIVALITE
>sequence3
MQCKSGTNNVFTAIKYTTNNNIIYKSENNDNIIFTKNIFNVVTTKDAFIFSKNRGIMNL
DITKKFDYHEHRPKLCVFKIINTQYVNSPEKMIDAWPTMDIVALITE
>sequence4_CP hypothetical protein [another virus]
MLRHSCVMPQQKLKKRFFFLRRLRKILRYFFTCNFLNLFFINREYNIENITLSYLKKERIPVWKTSDMSN
IVRKWWMFHRKTQLEDNIEIKKDIQLYHFFYNGLFIKTNYPYVYHIDKKKKYDFNDMKVIYLPAIHMHSK
>sequence5 hypothetical protein [another virus]
MLRHSCVMPQQKLKKRFFFLRRLRKILRYFFTCNFLNLFFINREYNIENITLSYLKKERIPVWKTSDMSN
IVRKWWMFHRKTQLEDNIEIKKDIQLYHFFYNGLFIKTNYPYVYHIDKKKKYDFNDMKVIYLPAIHMHSK
>sequence6 |hypothetical protein[virus]
MQCKSGTNNVFTAIKYTTNNNIIYKSENNDNIIFTKNIFNVVTTKDAFIFSKNRGIMNLD
ITKKFDYHEHRPKLCVFKIINTQYVNSPEKMIDAWPTMDIVALITE
>sequence7 |hypothetical protein[virus]
MQCKSGTNNVFTAIKYTTNNNIIYKSENNDNIIFTKNIFNVVTTKDAFIFSKNRGIMNLD
ITKKFDYHEHRPKLCVFKIINTQYVNSPEKMIDAWPTMDIVALITE