Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- /*
- * PREPROCESSING - Prepare genome intervals for filtering
- */
- blacklistChannel = Channel.fromPath(params.blacklist)
- process makeGenomeFilter {
- tag "$fasta"
- publishDir "${params.outdir}/reference_genome", mode: 'copy'
- input:
- file fasta from fasta_genome_filter
- each file(blacklistFile) from blacklistChannel
- output:
- file "$fasta" into genome_fasta // FASTA FILE FOR IGV
- file "*.fai" into genome_fai // FAI INDEX FOR REFERENCE GENOME
- file "*.txt" into genome_autosomes // TEXT FILE CONTAINING LISTING OF AUTOSOMAL CHROMOSOMES FOR ATAQV
- file "*.bed" into genome_filter_regions // BED FILE WITHOUT BLACKLIST REGIONS & MITOCHONDRIAL CONTIG FOR FILTERING
- file "*.sizes" into genome_sizes_mlib_bigwig, // CHROMOSOME SIZES FILE FOR BEDTOOLS
- genome_sizes_mrep_bigwig
- script:
- blacklist_filter = params.blacklist ? "sortBed -i ${blacklistFile} -g ${fasta}.sizes | complementBed -i stdin -g ${fasta}.sizes" : "awk '{print \$1, '0' , \$2}' OFS='\t' ${fasta}.sizes"
- name_filter = params.mito_name ? "| awk '\$1 !~ /${params.mito_name}/ {print \$0}'": ""
- mito_filter = params.keepMito ? "" : name_filter
- """
- samtools faidx $fasta
- get_autosomes.py ${fasta}.fai ${fasta}.autosomes.txt
- cut -f 1,2 ${fasta}.fai > ${fasta}.sizes
- $blacklist_filter $mito_filter > ${fasta}.include_regions.bed
- """
- }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement