2024-10-17 17:56:12 +00:00
|
|
|
name: make_reference
|
|
|
|
|
namespace: reference
|
|
|
|
|
description: |
|
|
|
|
|
Preprocess and build a transcriptome reference.
|
|
|
|
|
|
|
|
|
|
Example input files are:
|
|
|
|
|
- `genome_fasta`: https://ftp.ebi.ac.uk/pub/databases/gencode/Gencode_human/release_41/GRCh38.primary_assembly.genome.fa.gz
|
|
|
|
|
- `transcriptome_gtf`: https://ftp.ebi.ac.uk/pub/databases/gencode/Gencode_human/release_41/gencode.v41.annotation.gtf.gz
|
|
|
|
|
- `ercc`: https://assets.thermofisher.com/TFS-Assets/LSG/manuals/ERCC92.zip
|
|
|
|
|
authors:
|
|
|
|
|
- __merge__: /src/authors/angela_pisco.yaml
|
|
|
|
|
roles: [ author ]
|
|
|
|
|
- __merge__: /src/authors/robrecht_cannoodt.yaml
|
|
|
|
|
roles: [ author, maintainer ]
|
|
|
|
|
arguments:
|
|
|
|
|
# inputs
|
|
|
|
|
- type: file
|
|
|
|
|
name: --genome_fasta
|
|
|
|
|
required: true
|
|
|
|
|
description: "Reference genome fasta. Example: "
|
|
|
|
|
example: genome_fasta.fa.gz
|
|
|
|
|
- type: file
|
|
|
|
|
name: --transcriptome_gtf
|
|
|
|
|
required: true
|
|
|
|
|
description: Reference transcriptome annotation.
|
|
|
|
|
example: transcriptome.gtf.gz
|
|
|
|
|
- type: file
|
|
|
|
|
name: --ercc
|
|
|
|
|
description: ERCC sequence and annotation file.
|
|
|
|
|
example: ercc.zip
|
|
|
|
|
- type: string
|
|
|
|
|
name: --subset_regex
|
|
|
|
|
description: Will subset the reference chromosomes using the given regex.
|
|
|
|
|
example: (ERCC-00002|chr1)
|
|
|
|
|
- type: file
|
|
|
|
|
name: --output_fasta
|
|
|
|
|
direction: output
|
|
|
|
|
required: true
|
|
|
|
|
description: Output genome sequence fasta.
|
|
|
|
|
example: genome_sequence.fa.gz
|
|
|
|
|
- type: file
|
|
|
|
|
name: --output_gtf
|
|
|
|
|
direction: output
|
|
|
|
|
required: true
|
|
|
|
|
description: Output transcriptome annotation gtf.
|
|
|
|
|
example: transcriptome_annotation.gtf.gz
|
|
|
|
|
resources:
|
|
|
|
|
- type: bash_script
|
|
|
|
|
path: script.sh
|
|
|
|
|
test_resources:
|
|
|
|
|
- type: bash_script
|
2024-11-15 14:37:33 +00:00
|
|
|
path: test.sh
|
2024-10-17 17:56:12 +00:00
|
|
|
engines:
|
|
|
|
|
- type: docker
|
|
|
|
|
image: ubuntu:22.04
|
|
|
|
|
setup:
|
|
|
|
|
- type: apt
|
|
|
|
|
packages: [ pigz, seqkit, curl, wget, unzip, file]
|
|
|
|
|
runners:
|
|
|
|
|
- type: executable
|
|
|
|
|
- type: nextflow
|
|
|
|
|
directives:
|
|
|
|
|
label: [ highmem, highcpu ]
|