<?xml version="1.0" encoding="UTF-8"?>
<RUN_SET xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
  <RUN alias="54ea523ea3362929f685547d9a57c6fb" center_name="Broad Institute" broker_name="UM-SPH" run_center="Broad Institute" accession="SRR3203790">
    <IDENTIFIERS>
      <PRIMARY_ID>SRR3203790</PRIMARY_ID>
      <SUBMITTER_ID namespace="Broad Institute">54ea523ea3362929f685547d9a57c6fb</SUBMITTER_ID>
    </IDENTIFIERS>
    <TITLE>Secondary mapping Build 37 for NWD223081 [13466]</TITLE>
    <EXPERIMENT_REF accession="SRX1608897" refname="NWD223081-expt" refcenter="Broad Institute"/>
    <PROCESSING>
      <PIPELINE>
        <PIPE_SECTION section_name="read mapping">
          <STEP_INDEX> none </STEP_INDEX>
          <PREV_STEP_INDEX>NIL</PREV_STEP_INDEX>
          <PROGRAM> bwa mem </PROGRAM>
          <VERSION> 0.7.7-r441 </VERSION>
          <NOTES/>
        </PIPE_SECTION>
        <PIPE_SECTION section_name="sort / merge / mark duplicates">
          <STEP_INDEX> new </STEP_INDEX>
          <PREV_STEP_INDEX> none </PREV_STEP_INDEX>
          <PROGRAM> Picard </PROGRAM>
          <VERSION> (varies) </VERSION>
          <NOTES/>
        </PIPE_SECTION>
        <PIPE_SECTION section_name="realign around indels">
          <STEP_INDEX> yes </STEP_INDEX>
          <PREV_STEP_INDEX> new </PREV_STEP_INDEX>
          <PROGRAM> GATK IndelRealigner </PROGRAM>
          <VERSION> 3.3 </VERSION>
          <NOTES> knownAlleles=[        (RodBinding name=knownAlleles source=Homo_sapiens_assembly19.dbsnp.vcf),         (RodBinding name=knownAlleles2 source=Homo_sapiens_assembly19.known_indels.vcf),         (RodBinding name=knownAlleles3 source=Homo_sapiens_assembly19.variantEvalGoldStandard.vcf)],         targetIntervals = sample-specific </NOTES>
        </PIPE_SECTION>
        <PIPE_SECTION section_name="recalibrate base call quality scores">
          <STEP_INDEX> old </STEP_INDEX>
          <PREV_STEP_INDEX> yes </PREV_STEP_INDEX>
          <PROGRAM> GATK BaseRecalibrator </PROGRAM>
          <VERSION> 3.3 </VERSION>
          <NOTES> --useOriginalQualities        -knownSites Homo_sapiens_assembly19.dbsnp.vcf          -knownSites Homo_sapiens_assembly19.known_indels.vcf          -knownSites Homo_sapiens_assembly19.variantEvalGoldStandard.vcf </NOTES>
        </PIPE_SECTION>
        <PIPE_SECTION section_name="compress base call quality scores">
          <STEP_INDEX> done </STEP_INDEX>
          <PREV_STEP_INDEX> old </PREV_STEP_INDEX>
          <PROGRAM> bamUtils squeeze </PROGRAM>
          <VERSION> 1.0.13 </VERSION>
          <NOTES> --keepDups  --binMid  --binQualS 2,3,10,20,25,30,35,40,50  </NOTES>
        </PIPE_SECTION>
        <PIPE_SECTION section_name="convert to .cram format">
          <STEP_INDEX> home </STEP_INDEX>
          <PREV_STEP_INDEX> done </PREV_STEP_INDEX>
          <PROGRAM> samtools view -C </PROGRAM>
          <VERSION> 1.2 Using htslib 1.2.1 </VERSION>
          <NOTES> genome reference sequence retrieved from:  ftp://ftp.1000genomes.ebi.ac.uk/vol1/ftp/technical/reference/phase2_reference_assembly_sequence/hs37d5.fa.gz </NOTES>
        </PIPE_SECTION>
      </PIPELINE>
    </PROCESSING>
    <RUN_ATTRIBUTES>
      <RUN_ATTRIBUTE>
        <TAG>assembly</TAG>
        <VALUE>GRCh37</VALUE>
      </RUN_ATTRIBUTE>
      <RUN_ATTRIBUTE>
        <TAG>Alignment Provider</TAG>
        <VALUE>Sequencing Center</VALUE>
      </RUN_ATTRIBUTE>
    </RUN_ATTRIBUTES>
  </RUN>
</RUN_SET>
