You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

25 lines
800B

  1. import pandas as pd
  2. import sys, argparse, os
  3. from operator import itemgetter
  4. parser = argparse.ArgumentParser(description="this script is to annotate high confidence calls")
  5. parser.add_argument('-info', '--info', type=str, help='The infomation file', required=True)
  6. parser.add_argument('-vcf', '--vcf', type=str, help='The vcf file', required=True)
  7. parser.add_argument('-prefix', '--prefix', type=str, help='The outputname', required=True)
  8. args = parser.parse_args()
  9. # Rename input:
  10. info = args.info
  11. vcf = args.vcf
  12. prefix = args.prefix
  13. info = pd.read_table(info,header=None)
  14. vcf = pd.read_table(vcf,header=None)
  15. merged_df = pd.merge(vcf, info, how='inner', left_on=[0,1], right_on = [0,1])
  16. filename = prefix + '.annotated.txt'
  17. merged_df.to_csv(filename,header=None,index=None,sep="\t")