<?xml version="1.0" encoding="UTF-8"?>
<RUN_SET xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
  <RUN alias="dbb76854faeb6cdde9ab4f34c577c0bc" center_name="Broad Institute" broker_name="UM-SPH" run_center="Broad Institute" accession="SRR5088801">
    <IDENTIFIERS>
      <PRIMARY_ID>SRR5088801</PRIMARY_ID>
      <SUBMITTER_ID namespace="Broad Institute">dbb76854faeb6cdde9ab4f34c577c0bc</SUBMITTER_ID>
    </IDENTIFIERS>
    <TITLE>Secondary mapping Build 37 for NWD423324 [41045]</TITLE>
    <EXPERIMENT_REF accession="SRX2211103" refname="NWD423324-expt" refcenter="Broad Institute"/>
    <PROCESSING>
      <PIPELINE>
        <PIPE_SECTION section_name="read mapping">
          <STEP_INDEX>none</STEP_INDEX>
          <PREV_STEP_INDEX>NIL</PREV_STEP_INDEX>
          <PROGRAM>bwa mem</PROGRAM>
          <VERSION>0.7.7-r441</VERSION>
          <NOTES>1000 Genomes hs37d5 reference sequence</NOTES>
        </PIPE_SECTION>
        <PIPE_SECTION section_name="sort / merge / mark duplicates">
          <STEP_INDEX>new</STEP_INDEX>
          <PREV_STEP_INDEX>none</PREV_STEP_INDEX>
          <PROGRAM>Picard</PROGRAM>
          <VERSION>(varies)</VERSION>
          <NOTES/>
        </PIPE_SECTION>
        <PIPE_SECTION section_name="realign around indels">
          <STEP_INDEX>yes</STEP_INDEX>
          <PREV_STEP_INDEX>new</PREV_STEP_INDEX>
          <PROGRAM>GATK IndelRealigner</PROGRAM>
          <VERSION>3.3</VERSION>
          <NOTES>knownAlleles=[ (RodBinding name=knownAlleles source=Homo_sapiens_assembly19.dbsnp.vcf), (RodBinding name=knownAlleles2 source=Homo_sapiens_assembly19.known_indels.vcf), (RodBinding name=knownAlleles3 source=Homo_sapiens_assembly19.variantEvalGoldStandard.vcf)], targetIntervals = sample-specific</NOTES>
        </PIPE_SECTION>
        <PIPE_SECTION section_name="recalibrate base call quality scores">
          <STEP_INDEX>old</STEP_INDEX>
          <PREV_STEP_INDEX>yes</PREV_STEP_INDEX>
          <PROGRAM>GATK BaseRecalibrator</PROGRAM>
          <VERSION>3.3</VERSION>
          <NOTES>--useOriginalQualities -knownSites Homo_sapiens_assembly19.dbsnp.vcf -knownSites Homo_sapiens_assembly19.known_indels.vcf -knownSites Homo_sapiens_assembly19.variantEvalGoldStandard.vcf</NOTES>
        </PIPE_SECTION>
        <PIPE_SECTION section_name="compress base call quality scores">
          <STEP_INDEX>done</STEP_INDEX>
          <PREV_STEP_INDEX>old</PREV_STEP_INDEX>
          <PROGRAM>bamUtils squeeze</PROGRAM>
          <VERSION>1.0.13</VERSION>
          <NOTES>--keepDups --binMid --binQualS 2,3,10,20,25,30,35,40,50</NOTES>
        </PIPE_SECTION>
        <PIPE_SECTION section_name="convert to .cram format">
          <STEP_INDEX>home</STEP_INDEX>
          <PREV_STEP_INDEX>done</PREV_STEP_INDEX>
          <PROGRAM>samtools view -C</PROGRAM>
          <VERSION>1.3.1 Using htslib 1.3.1</VERSION>
          <NOTES>genome reference sequence retrieved from: ftp://ftp.1000genomes.ebi.ac.uk/vol1/ftp/technical/reference/phase2_reference_assembly_sequence/hs37d5.fa.gz</NOTES>
        </PIPE_SECTION>
      </PIPELINE>
    </PROCESSING>
    <RUN_ATTRIBUTES>
      <RUN_ATTRIBUTE>
        <TAG>assembly</TAG>
        <VALUE>GRCh37</VALUE>
      </RUN_ATTRIBUTE>
      <RUN_ATTRIBUTE>
        <TAG>options</TAG>
        <VALUE>--defer-secondary</VALUE>
      </RUN_ATTRIBUTE>
    </RUN_ATTRIBUTES>
  </RUN>
</RUN_SET>
