Mox Fastqc And Minia

Playing around a bit with Mox (crippled by lack of disk space). Ran FastQC with the following SLURM script:

#!/bin/bash
## SLURM batch script: runs FastQC on a single gzipped FASTQ file.
## Job Name
#SBATCH --job-name=fastqc-NS
## Allocation Definition
#SBATCH --account=srlab
#SBATCH --partition=srlab
## Resources
## Nodes (We only get 1, so this is fixed)
#SBATCH --nodes=1
## Walltime (the value below is hours:minutes:seconds, i.e. 24 hours;
## Slurm also accepts a leading "days-" prefix)
#SBATCH --time=24:00:00
## Memory per node
#SBATCH --mem=500G
## Specify the working directory for this job.
## --chdir is the current name of this option; the older --workdir spelling
## was deprecated and is rejected by newer Slurm releases.
#SBATCH --chdir=/gscratch/srlab/sr320/analyses/0901

## paths.sh is sourced before the run; its contents are not shown here
## (presumably it sets up program paths -- confirm against the file).
source /gscratch/srlab/programs/scripts/paths.sh

## -t 28 sets the FastQC thread count; the only input is the R1 read file.
/gscratch/srlab/programs/FastQC/fastqc \
-t 28 \
/gscratch/scrubbed/sr320/AD002_S9_L001_R1_001.fastq.gz

And Minia (note the location):

#!/bin/bash
## SLURM batch script: runs the Minia assembler on a single gzipped FASTQ file.
## Job Name
#SBATCH --job-name=minia
## Allocation Definition
#SBATCH --account=srlab
#SBATCH --partition=srlab
## Resources
## Nodes (We only get 1, so this is fixed)
#SBATCH --nodes=1
## Walltime (the value below is hours:minutes:seconds, i.e. 100 hours;
## Slurm also accepts a leading "days-" prefix)
#SBATCH --time=100:00:00
## Memory per node
#SBATCH --mem=500G
## Specify the working directory for this job.
## --chdir is the current name of this option; the older --workdir spelling
## was deprecated and is rejected by newer Slurm releases.
#SBATCH --chdir=/gscratch/srlab/sr320/analyses/0901b

## paths.sh is sourced before the run; its contents are not shown here
## (presumably it sets up program paths -- confirm against the file).
source /gscratch/srlab/programs/scripts/paths.sh

## Minia options used:
##   -nb-cores    number of cores
##   -max-memory  memory cap (assumed to be in MB -- confirm in the Minia manual)
##   -in          input reads (R2 file)
##   -out-dir     output directory passed to Minia
/gscratch/srlab/sr320/programs/minia-v2.0.7-bin-Linux/bin/minia \
-nb-cores 28 \
-max-memory 500000 \
-in /gscratch/scrubbed/sr320/AD002_S9_L001_R2_001.fastq.gz \
-out-dir /gscratch/scrubbed/sr320/

Minia seems to create a lot of temporary files in the working directory (these probably could have been written to scrubbed instead):

[sr320@mox1 0901b]$ ls
slurm-71843.out			       trashme_32333_dsk_partitions.parts.20  trashme_32333_dsk_partitions.parts.34  trashme_32333_dsk_partitions.parts.48
slurm-71844.out			       trashme_32333_dsk_partitions.parts.21  trashme_32333_dsk_partitions.parts.35  trashme_32333_dsk_partitions.parts.49
trashme_32333_dsk_partitions.parts.0   trashme_32333_dsk_partitions.parts.22  trashme_32333_dsk_partitions.parts.36  trashme_32333_dsk_partitions.parts.5
trashme_32333_dsk_partitions.parts.1   trashme_32333_dsk_partitions.parts.23  trashme_32333_dsk_partitions.parts.37  trashme_32333_dsk_partitions.parts.50
trashme_32333_dsk_partitions.parts.10  trashme_32333_dsk_partitions.parts.24  trashme_32333_dsk_partitions.parts.38  trashme_32333_dsk_partitions.parts.51
trashme_32333_dsk_partitions.parts.11  trashme_32333_dsk_partitions.parts.25  trashme_32333_dsk_partitions.parts.39  trashme_32333_dsk_partitions.parts.52
trashme_32333_dsk_partitions.parts.12  trashme_32333_dsk_partitions.parts.26  trashme_32333_dsk_partitions.parts.4   trashme_32333_dsk_partitions.parts.53
trashme_32333_dsk_partitions.parts.13  trashme_32333_dsk_partitions.parts.27  trashme_32333_dsk_partitions.parts.40  trashme_32333_dsk_partitions.parts.54
trashme_32333_dsk_partitions.parts.14  trashme_32333_dsk_partitions.parts.28  trashme_32333_dsk_partitions.parts.41  trashme_32333_dsk_partitions.parts.55
trashme_32333_dsk_partitions.parts.15  trashme_32333_dsk_partitions.parts.29  trashme_32333_dsk_partitions.parts.42  trashme_32333_dsk_partitions.parts.6
trashme_32333_dsk_partitions.parts.16  trashme_32333_dsk_partitions.parts.3   trashme_32333_dsk_partitions.parts.43  trashme_32333_dsk_partitions.parts.7
trashme_32333_dsk_partitions.parts.17  trashme_32333_dsk_partitions.parts.30  trashme_32333_dsk_partitions.parts.44  trashme_32333_dsk_partitions.parts.8
trashme_32333_dsk_partitions.parts.18  trashme_32333_dsk_partitions.parts.31  trashme_32333_dsk_partitions.parts.45  trashme_32333_dsk_partitions.parts.9
trashme_32333_dsk_partitions.parts.19  trashme_32333_dsk_partitions.parts.32  trashme_32333_dsk_partitions.parts.46
trashme_32333_dsk_partitions.parts.2   trashme_32333_dsk_partitions.parts.33  trashme_32333_dsk_partitions.parts.47
[sr320@mox1 0901b]$ tail slurm-71844.out 
[DSK: Collecting stats on AD002_S9_L... ]  100  %   elapsed:   0 min 47 sec    estimated remaining:   0 min 0  sec   cpu:  243.5 %   mem: [  73,   73,   73] MB 
[DSK: Pass 1/1, Step 2: counting kmers  ]  82.8 %   elapsed:  17 min 8  sec    estimated remaining:   3 min 34 sec   cpu:  368.9 %   mem: [43863, 43863, 43865] MB

Tail of the SLURM output file:

minia                                   
    -nb-cores                                : 28
    -max-memory                              : 500000
    -in                                      : /gscratch/scrubbed/sr320/AD002_S9_L001_R2_001.fastq.gz
    -out-dir                                 : /gscratch/scrubbed/sr320/
    -traversal                               : contig
    -starter                                 : best
    -contig-max-len                          : 10000000
    -bfs-max-depth                           : 500
    -bfs-max-breadth                         : 20
    -fasta-line                              : 0
    -kmer-size                               : 31
    -abundance-min                           : 3
    -abundance-max                           : 4294967295
    -histo-max                               : 10000
    -solidity-kind                           : sum
    -max-disk                                : 0
    -minimizer-type                          : 0
    -minimizer-size                          : 8
    -repartition-type                        : 0
    -bloom                                   : neighbor
    -debloom                                 : cascading
    -debloom-impl                            : minimizer
    -branching-nodes                         : stored
    -topology-stats                          : 0
    -mphf                                    : emphf
    -verbose                                 : 1
    -integer-precision                       : 0
    -verbose                                 : 1
    stats                                   
        traversal                                : contig
        start_selector                           : best
        nb_contigs                               : 8044789
        nb_small_contigs_discarded               : 9241683
        nt_assembled                             : 1160242262
        max_length                               : 5239
        max_length_left                          : 4197
        max_length_right                         : 4855
        debugging traversal stats               
        large breadth                            : 1344
        large depth                              : 135
        marked kmer inside traversal             : 5595051
        traversal ends with dead-ends            : 2587076
        in-branching large depth                 : 2178233
        in-branching large breadth               : 2196283
        in-branching other                       : 3276932
        couldn't validate consensuses            : 154210
    time                                     : 36742.777
        assembly                                 : 36742.777

and the resulting contigs file:

[sr320@mox1 0901b]$ ls
AD002_S9_L001_R2_001.contigs.fa  slurm-71843.out  slurm-71844.out
[sr320@mox1 0901b]$ head AD002_S9_L001_R2_001.contigs.fa 
>0__len__91
AAAAAAAAAAAAAAAAAAAAAAAAAACCTCACAAGCTTTGACATATTAATGTTACACTTATTGGTGTACTTAAAAGAAATTACTAGTATAC
>1__len__126
AAAAAAAAAAAAAAAAAAAAAAAAAAACTGCCAGCCAATTAACACAAATTTATAAAATATAATCAGTGACTTAATACATGGGATAGATACGGTGACATTAAGGGATGTGTATTCAGAGCTGTCAAT
>2__len__461
AAAAAAAAAAAAAAAAAAAAAAAAAACGATTTCAGATTGAAATGTAAATATGTTAAGATGCAGCATATTATTTCACATCAACATAAGGTCAAACCTTTGGCAGGTTCGACATGATGATTAATCAAAATATGTTTTGAAATGTATATATACAGGTAACATTGGGTTTATATATATAAACATAATTAAACCCAATGTTGTTGTCTGAAATTCCGGGACTTAGATAAAACAAAAGTTGTATATTTTCCACAGTGAACTATGGTAAAATGGTAAAAACATACATCTTTCTTATTCTTACAGTCCATGGTTGGATTTCTCCATCTTCTTCAAATGGAAATAGAATATATCGTCCTTTTAAAAGTATTATCCTGTACTTTTACAAATCAGACACAATTCATACTTCCGCTCGTCCTCGGTAACAGTTCTTTGTAATAGTGTTACTACTGTCCTTCCTAAAAAAGAAA
>3__len__84
AAAAAAAAAAAAAAAAAAAAAAAAAACGTTGACAAATATGAAAGCAGCATTTTTTCAAATAAAAGCACTGTTTGTCTAGTTAAA
>4__len__101
AAAAAAAAAAAAAAAAAAAAAAAAAATCGGAAAAATACTAATTTCGAAAATTAAAAGGAATGTTAAGGGGCGTGTTAGTTATAACAGCGGAAAAGGTTTCT
Written on September 1, 2017