Build pipeline: vsh-ci-build-template-k4qzr
Source commit: 173327cc56
Source message: Cellranger multi conversion: fix combined AB + CB probe experiments (#1062)
119 lines
3.7 KiB
Bash
Executable File
119 lines
3.7 KiB
Bash
Executable File
#!/bin/bash
|
|
|
|
set -eo pipefail
|
|
|
|
# get the root of the directory
|
|
REPO_ROOT=$(git rev-parse --show-toplevel)
|
|
|
|
# ensure that the command below is run from the root of the repository
|
|
cd "$REPO_ROOT"
|
|
|
|
ID=pbmc_1k_protein_v3
|
|
OUT=resources_test/$ID/$ID
|
|
DIR=$(dirname "$OUT")
|
|
|
|
# ideally, this would be a versioned pipeline run
|
|
[ -d "$DIR" ] || mkdir -p "$DIR"
|
|
|
|
# dataset page:
|
|
# https://www.10xgenomics.com/resources/datasets/1-k-pbm-cs-from-a-healthy-donor-gene-expression-and-cell-surface-protein-3-standard-3-0-0
|
|
|
|
# download metrics summary
|
|
wget https://cf.10xgenomics.com/samples/cell-exp/3.0.0/pbmc_1k_protein_v3/pbmc_1k_protein_v3_metrics_summary.csv \
|
|
-O "${OUT}_metrics_summary.csv"
|
|
|
|
# download counts h5 file
|
|
wget https://cf.10xgenomics.com/samples/cell-exp/3.0.0/pbmc_1k_protein_v3/pbmc_1k_protein_v3_filtered_feature_bc_matrix.h5 \
|
|
-O "${OUT}_filtered_feature_bc_matrix.h5"
|
|
|
|
wget https://cf.10xgenomics.com/samples/cell-exp/3.0.0/pbmc_1k_protein_v3/pbmc_1k_protein_v3_raw_feature_bc_matrix.h5 \
|
|
-O "${OUT}_raw_feature_bc_matrix.h5"
|
|
|
|
# download counts matrix tar gz file
|
|
wget https://cf.10xgenomics.com/samples/cell-exp/3.0.0/pbmc_1k_protein_v3/pbmc_1k_protein_v3_filtered_feature_bc_matrix.tar.gz \
|
|
-O "${OUT}_filtered_feature_bc_matrix.tar.gz"
|
|
|
|
# extract matrix tar gz
|
|
mkdir -p "${OUT}_filtered_feature_bc_matrix"
|
|
tar -xvf "${OUT}_filtered_feature_bc_matrix.tar.gz" \
|
|
-C "${OUT}_filtered_feature_bc_matrix" \
|
|
--strip-components 1
|
|
rm "${OUT}_filtered_feature_bc_matrix.tar.gz"
|
|
|
|
# convert 10x h5 to h5mu
|
|
target/docker/convert/from_10xh5_to_h5mu/from_10xh5_to_h5mu \
|
|
--input "${OUT}_filtered_feature_bc_matrix.h5" \
|
|
--input_metrics_summary "${OUT}_metrics_summary.csv" \
|
|
--output "${OUT}_filtered_feature_bc_matrix.h5mu"
|
|
|
|
# run single sample
|
|
nextflow \
|
|
run . \
|
|
-main-script target/nextflow/workflows/rna/rna_singlesample/main.nf \
|
|
-c src/workflows/utils/labels_ci.config \
|
|
-profile docker \
|
|
--id pbmc_1k_protein_v3_uss \
|
|
--input "${OUT}_filtered_feature_bc_matrix.h5mu" \
|
|
--output "`basename $OUT`_uss.h5mu" \
|
|
--publishDir `dirname $OUT` \
|
|
-resume
|
|
|
|
# add the sample ID to the mudata object
|
|
nextflow \
|
|
run . \
|
|
-main-script target/nextflow/metadata/add_id/main.nf \
|
|
-c src/workflows/utils/labels_ci.config \
|
|
-profile docker \
|
|
--id pbmc_1k_protein_v3_uss \
|
|
--input "${OUT}_uss.h5mu" \
|
|
--input_id "pbmc_1k_protein_v3_uss" \
|
|
--output "`basename $OUT`_uss_with_id.h5mu" \
|
|
--output_compression "gzip" \
|
|
--publishDir `dirname $OUT` \
|
|
-resume
|
|
|
|
# run multisample
|
|
nextflow \
|
|
run . \
|
|
-main-script target/nextflow/workflows/rna/rna_multisample/main.nf \
|
|
-c src/workflows/utils/labels_ci.config \
|
|
-profile docker \
|
|
--id pbmc_1k_protein_v3_ums \
|
|
--input "${OUT}_uss_with_id.h5mu" \
|
|
--output "`basename $OUT`_ums.h5mu" \
|
|
--publishDir `dirname $OUT` \
|
|
-resume
|
|
|
|
rm "${OUT}_uss_with_id.h5mu"
|
|
|
|
# run dimred
|
|
nextflow \
|
|
run . \
|
|
-main-script target/nextflow/workflows/multiomics/dimensionality_reduction/main.nf \
|
|
-c src/workflows/utils/labels_ci.config \
|
|
-profile docker \
|
|
--id pbmc_1k_protein_v3_mms \
|
|
--input "${OUT}_ums.h5mu" \
|
|
--output "`basename $OUT`_mms.h5mu" \
|
|
--publishDir `dirname $OUT` \
|
|
--obs_covariates sample_id \
|
|
-resume
|
|
|
|
# run integration
|
|
nextflow \
|
|
run . \
|
|
-main-script target/nextflow/workflows/integration/harmony_leiden/main.nf \
|
|
-c src/workflows/utils/labels_ci.config \
|
|
-profile docker \
|
|
--id pbmc_1k_protein_v3_mms_integration \
|
|
--input "${OUT}_mms.h5mu" \
|
|
--output "`basename $OUT`_mms.h5mu" \
|
|
--publishDir `dirname $OUT` \
|
|
--obs_covariates sample_id \
|
|
-resume
|
|
|
|
python <<HEREDOC
|
|
import mudata as mu
|
|
mudata = mu.read_h5mu("${DIR}/pbmc_1k_protein_v3_filtered_feature_bc_matrix.h5mu")
|
|
mudata.mod["rna"].write_h5ad("${DIR}/pbmc_1k_protein_v3_filtered_feature_bc_matrix_rna.h5ad")
|
|
HEREDOC |