github.com/informationsea/shellflow@v0.1.3/docs/source/example.rst (about)

     1  Examples
     2  ========
     3  
     4  Build C program
     5  ---------------
     6  
     7  .. code:: bash
     8  
     9      cc -o [[lib1.o]] ((lib1.c)) # ((lib1.h))
    10      cc -o [[lib2.o]] ((lib2.c)) # ((lib2.h))
    11      cc -o [[main.o]] ((main.c)) # ((lib1.h)) ((lib2.h))
    12      cc -o [[program]] ((lib1.o)) ((lib2.o)) ((main.o))
    13  
    14  .. figure:: ./images/example1.png
    15     :alt: Dependecy graph
    16  
    17     Dependecy graph
    18  
    19  Prepare hs37d5 index file
    20  -------------------------
    21  
    22  .. code:: bash
    23  
    24      curl -o [[hs37d5.fa.gz]] -L ftp://ftp.1000genomes.ebi.ac.uk/vol1/ftp/technical/reference/phase2_reference_assembly_sequence/hs37d5.fa.gz
    25      gzip -dc ((hs37d5.fa.gz)) > [[hs37d5.fa]]
    26      bwa index ((hs37d5.fa)) # [[hs37d5.fa.bwt]]
    27  
    28  .. figure:: ./images/example2.png
    29     :alt: Dependecy graph
    30  
    31     Dependecy graph
    32  
    33  Analyze simulated FASTQ with GATK
    34  ---------------------------------
    35  
    36  .. code:: bash
    37  
    38      #% GATK_VERSION = "4.0.10.1"
    39      #% BWA_VERSION = "0.7.17"
    40      #% SAMTOOLS_VERSION = "1.9"
    41  
    42      # Generate simulation FASTQ
    43      python3 ((create-mutated-fasta.py)) ((e-coli-NC_011750.1.fasta)) --output [[e-coli-NC_011750.1-mutated-base.fasta]] --seed 123
    44      for i in 1 2; do
    45          python3 ((create-mutated-fasta.py)) ((e-coli-NC_011750.1-mutated-base.fasta)) --output [[e-coli-NC_011750.1-mutated{{i}}.fasta]] --seed 123{{i}}
    46          art_bin_MountRainier/art_illumina -ss HS25 -i ((e-coli-NC_011750.1-mutated{{i}}.fasta)) -p -l 150 -f 20 -m 200 -s 10 -o generated{{i}} # [[generated{{i}}1.fq]] [[generated{{i}}2.fq]]
    47          for j in 1 2; do
    48              sed -e 's/@/@{{i}}-/g' ((generated{{i}}{{j}}.fq))|gzip -c > [[generated{{i}}{{j}}-fix.fq.gz]]
    49          done
    50      done
    51  
    52      # Mapping
    53      for i in 1 2; do
    54          bwa-{{BWA_VERSION}}/bwa mem -R "@RG\tID:ECOLI-SIM\tSM:ECOLI_SIM\tPL:illumina\tLB:ECOLI_SIM" e-coli-NC_011750.1.fasta ((generated{{i}}1-fix.fq.gz)) ((generated{{i}}2-fix.fq.gz))|samtools-{{SAMTOOLS_VERSION}}/samtools sort -o [[generated{{i}}.bam]] - # ((e-coli-NC_011750.1.fasta.bwt))
    55          gatk-{{GATK_VERSION}}/gatk --java-options "-Xmx4G" MarkDuplicates -I ((generated{{i}}.bam)) -O [[generated{{i}}-markdup.bam]] -M [[generated{{i}}-markdup-metrics.txt]]
    56          gatk-{{GATK_VERSION}}/gatk --java-options "-Xmx4G" BaseRecalibrator -I ((generated{{i}}-markdup.bam)) -O [[generated{{i}}-bqsr.txt]] -R ((e-coli-NC_011750.1.fasta)) --known-sites ((empty.vcf.gz)) # ((e-coli-NC_011750.1.dict))
    57      done
    58  
    59      gatk-{{GATK_VERSION}}/gatk --java-options "-Xmx4G" GatherBQSRReports -I ((generated1-bqsr.txt)) -I ((generated2-bqsr.txt)) -O [[generated-bqsr-merged.txt]]
    60  
    61      # Apply BQSR
    62      for i in 1 2; do
    63          gatk-{{GATK_VERSION}}/gatk --java-options "-Xmx4G" ApplyBQSR -R ((e-coli-NC_011750.1.fasta)) -I ((generated{{i}}-markdup.bam)) -O [[generated{{i}}-recal.bam]] --bqsr-recal-file ((generated-bqsr-merged.txt)) # ((e-coli-NC_011750.1.dict))
    64      done
    65  
    66      # Merge
    67  
    68      samtools-{{SAMTOOLS_VERSION}}/samtools merge -f [[generated-merged.bam]] ((generated1-recal.bam)) ((generated2-recal.bam))
    69      samtools-{{SAMTOOLS_VERSION}}/samtools index ((generated-merged.bam)) # [[generated-merged.bam.bai]]
    70  
    71      # Variant call
    72      gatk-{{GATK_VERSION}}/gatk --java-options "-Xmx4g" HaplotypeCaller -R ((e-coli-NC_011750.1.fasta)) -I ((generated-merged.bam)) -O [[generated-call.vcf.gz]] -ERC GVCF -bamout [[generated-merged-realigned.bam]] # ((e-coli-NC_011750.1.dict)) ((generated-merged.bam.bai))
    73      gatk-{{GATK_VERSION}}/gatk --java-options "-Xmx4g" GenotypeGVCFs -R ((e-coli-NC_011750.1.fasta)) -V ((generated-call.vcf.gz)) -O [[generated-call-result.vcf.gz]] # ((e-coli-NC_011750.1.dict))
    74  
    75  .. figure:: ./images/example3.png
    76     :alt: dependecy graph
    77  
    78     dependecy graph