Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
25 changes: 0 additions & 25 deletions data/templates/0.mapping_minimap2_db.sbatch

This file was deleted.

4 changes: 3 additions & 1 deletion data/templates/1.hifiasm-meta_new.sbatch
Original file line number Diff line number Diff line change
Expand Up @@ -8,10 +8,12 @@
#SBATCH -o {{output}}/step-1/logs/%x-%A_%a.out
#SBATCH -e {{output}}/step-1/logs/%x-%A_%a.out
#SBATCH --array {{array_params}}

source ~/.bashrc
set -e
conda activate {{conda_environment}}

cd {{output}}/step-1

step=${SLURM_ARRAY_TASK_ID}
input=$(head -n $step {{output}}/sample_list.txt | tail -n 1)

Expand Down
3 changes: 1 addition & 2 deletions data/templates/2.get-circular-genomes.sbatch
Original file line number Diff line number Diff line change
Expand Up @@ -10,9 +10,8 @@
#SBATCH --array {{array_params}}

source ~/.bashrc

set -e
conda activate {{conda_environment}}

cd {{output}}/step-1

step=${SLURM_ARRAY_TASK_ID} ##1000_2, 1000_1
Expand Down
1 change: 1 addition & 0 deletions data/templates/3.minimap2_assembly.sbatch
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@
#SBATCH --array {{array_params}}

source ~/.bashrc
set -e
conda activate {{conda_environment}}
cd {{output}}

Expand Down
2 changes: 1 addition & 1 deletion data/templates/4.metawrap_binning_new.sbatch
Original file line number Diff line number Diff line change
Expand Up @@ -10,8 +10,8 @@
#SBATCH --array {{array_params}}

source ~/.bashrc
set -e
conda activate {{conda_environment}}

cd {{output}}

step=${SLURM_ARRAY_TASK_ID}
Expand Down
4 changes: 2 additions & 2 deletions data/templates/5.DAS_Tools_prepare_batch3_test.sbatch
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@
#SBATCH --array {{array_params}}

source ~/.bashrc

set -e
conda activate {{conda_environment}}
cd {{output}}

Expand All @@ -35,4 +35,4 @@ Fasta_to_Contig2Bin.sh -i ./concoct_bins -e fa > ${sample_name}.concoct.tsv
Fasta_to_Contig2Bin.sh -i ./maxbin2_bins -e fa > ${sample_name}.maxbin2.tsv
Fasta_to_Contig2Bin.sh -i ./metabat2_bins -e fa > ${sample_name}.metabat2.tsv

DAS_Tool --bins=${sample_name}.concoct.tsv,${sample_name}.maxbin2.tsv,${sample_name}.metabat2.tsv --contigs={{output}}/step-2/${sample_name}_noLCG.fa --outputbasename={{output}}/${folder}/${sample_name}/${sample_name} --labels=CONCOCT,MaxBin,MetaBAT --threads={{nprocs}} --search_engine=diamond --dbDirectory=${DAS_db} --write_bins
DAS_Tool --bins=${sample_name}.concoct.tsv,${sample_name}.maxbin2.tsv,${sample_name}.metabat2.tsv --contigs={{output}}/step-2/${sample_name}_noLCG.fa --outputbasename={{output}}/${folder}/${sample_name}/${sample_name} --labels=CONCOCT,MaxBin,MetaBAT --threads={{nprocs}} --search_engine=diamond --dbDirectory=${DAS_db} --write_bins
1 change: 1 addition & 0 deletions data/templates/6.MAG_rename.sbatch
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@
#SBATCH --array {{array_params}}

source ~/.bashrc
set -e
conda activate {{conda_environment}}
cd {{output}}

Expand Down
3 changes: 1 addition & 2 deletions data/templates/7.checkm_batch.sbatch
Original file line number Diff line number Diff line change
Expand Up @@ -11,9 +11,8 @@


source ~/.bashrc

set -e
conda activate {{conda_environment}}

cd {{output}}

step=${SLURM_ARRAY_TASK_ID}
Expand Down
32 changes: 32 additions & 0 deletions data/templates/woltka_minimap2.sbatch
Original file line number Diff line number Diff line change
@@ -0,0 +1,32 @@
#!/bin/bash
#SBATCH -J {{job_name}}
#SBATCH -p qiita
#SBATCH -N {{node_count}}
#SBATCH -n {{nprocs}}
#SBATCH --time {{wall_time_limit}}
#SBATCH --mem {{mem_in_gb}}G
#SBATCH -o {{output}}/minimap2/logs/%x-%A_%a.out
#SBATCH -e {{output}}/minimap2/logs/%x-%A_%a.out
#SBATCH --array {{array_params}}

source ~/.bashrc
set -e
conda activate {{conda_environment}}
mkdir -p {{output}}/alignments
cd {{output}}/
db=/ddn_scratch/qiita_t/working_dir/tmp/db/WoLr2.mmi

step=${SLURM_ARRAY_TASK_ID}
input=$(head -n $step {{output}}/sample_list.txt | tail -n 1)

sample_name=`echo $input | awk '{print $1}'`
filename=`echo $input | awk '{print $2}'`

fn=`basename ${filename}`

minimap2 -x map-hifi -t {{nprocs}} -a \
--secondary=no --MD --eqx ${db} \
${filename} | \
samtools sort -@ {{nprocs}} - | \
awk 'BEGIN { FS=OFS="\t" } /^@/ { print; next } { $10="*"; $11="*" } 1' | \
xz -1 -T1 > {{output}}/alignments/${sample_name}.sam.xz
49 changes: 49 additions & 0 deletions data/templates/woltka_minimap2_merge.sbatch
Original file line number Diff line number Diff line change
@@ -0,0 +1,49 @@
#!/bin/bash
#SBATCH -J {{job_name}}
#SBATCH -p qiita
#SBATCH -N {{node_count}}
#SBATCH -n {{nprocs}}
#SBATCH --time {{wall_time_limit}}
#SBATCH --mem {{mem_in_gb}}G
#SBATCH -o {{output}}/merge/logs/%x-%A_%a.out
#SBATCH -e {{output}}/merge/logs/%x-%A_%a.out

source ~/.bashrc
set -e
conda activate {{conda_environment}}
cd {{output}}/
tax=/projects/wol/qiyun/wol2/databases/minimap2/WoLr2.tax
coords=/projects/wol/qiyun/wol2/databases/minimap2/WoLr2.coords
len_map=/projects/wol/qiyun/wol2/databases/minimap2/WoLr2/length.map
functional_dir=/projects/wol/qiyun/wol2/databases/minimap2/WoLr2/

mkdir -p {{output}}/coverages/

for f in `ls alignments/*.sam.xz`; do
sn=`basename ${f/.sam.xz/}`;
of={{output}}/bioms/${sn};
mkdir -p ${of};
echo "woltka classify -i ${f} -o ${of}/none.biom --no-demux --lineage ${tax} --rank none --outcov {{output}}/coverages/";
echo "woltka classify -i ${f} -o ${of}/per-gene.biom --no-demux -c ${coords}";
done | parallel -j {{node_count}}
wait

for f in `ls bioms/*/per-gene.biom`; do
dn=`dirname ${f}`;
sn=`basename ${sn}`;
echo "woltka collapse -i ${f} -m ${functional_dir}/orf-to-ko.map.xz -o ${dn}/ko.biom; " \
"woltka collapse -i ${dn}/ko.biom -m ${functional_dir}/ko-to-ec.map -o ${dn}/ec.biom; " \
"woltka collapse -i ${dn}/ko.biom -m ${functional_dir}/ko-to-reaction.map -o ${dn}/reaction.biom; " \
"woltka collapse -i ${dn}/reaction.biom -m ${functional_dir}/reaction-to-module.map -o ${dn}/module.biom; " \
"woltka collapse -i ${dn}/module.biom -m ${functional_dir}/module-to-pathway.map -o ${dn}/pathway.biom;"
done | parallel -j {{node_count}}
wait

# MISSING:
# merge bioms!

find {{output}}/coverages/ -iname "*.cov" > {{output}}/cov_files.txt
micov consolidate --paths {{output}}/cov_files.txt --lengths ${len_map} --output {{output}}/coverages.tgz

cd alignments
tar -cvf ../alignments.tar *.sam.xz
38 changes: 35 additions & 3 deletions qp_pacbio/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,11 +6,43 @@
# The full license is in the file LICENSE, distributed with this software.
# -----------------------------------------------------------------------------
from qiita_client import QiitaPlugin, QiitaCommand
from .qp_pacbio import pacbio_processing
from .qp_pacbio import pacbio_processing, minimap2_processing
from .util import plugin_details

__version__ = "2025.9"

plugin = QiitaPlugin("qp-pacbio", __version__, "PacBio Processing")
plugin = QiitaPlugin(**plugin_details)

#
# minimap2 command
#

req_params = {'artifact_id': ('integer', ['per_sample_FASTQ'])}
opt_params = dict()
outputs = {
# taxonomic
'Per genome Predictions': 'BIOM',
'Per gene Predictions': 'BIOM',
# functional
'KEGG Ontology (KO)': 'BIOM',
'KEGG Enzyme (EC)': 'BIOM',
'KEGG Pathway': 'BIOM',
}
dflt_param_set = dict()

minimap2_cmd = QiitaCommand(
"Woltka v0.1.7, minimap2",
"Functional and Taxonomic Predictions",
minimap2_processing,
req_params,
opt_params,
outputs,
dflt_param_set,
)
plugin.register_command(minimap2_cmd)

#
# pacbio processing pipeline command
#

req_params = {
"artifact_id": ("integer", [None]),
Expand Down
Loading
Loading