Skip to content

Commit

Permalink
Release v1.0
Browse files Browse the repository at this point in the history
  • Loading branch information
ArthurDondi committed Oct 7, 2024
1 parent ec1690b commit 9a259ff
Show file tree
Hide file tree
Showing 70 changed files with 1,801 additions and 3,443 deletions.
5 changes: 4 additions & 1 deletion .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,9 @@
#snakemake logs folders
.snakemake/
logs/
benchmarks/

#Large files
CTAT_LR_Fusion/ctat_lr_fusion.v0.10.0.simg
ctat_lr_fusion.v0.13.0.simg

*test*
187 changes: 88 additions & 99 deletions config/config.yaml
Original file line number Diff line number Diff line change
@@ -1,134 +1,123 @@
# LongSom config yaml file

# Change those values to yours
User:
input_dir: /path/to/input_dir
output_dir: /path/to/output_dir
sample_map: /path/to/sample_map.tsv
cancer_cell_type: HGSOC

# Change if you use a custom reference
Reference:
genome: /../ref/GRCh38_gencode_v44_CTAT_lib_Oct292023.plug-n-play/ctat_genome_lib_build_dir/ref_genome.fa
isoforms: /../ref/GRCh38_gencode_v44_CTAT_lib_Oct292023.plug-n-play/ctat_genome_lib_build_dir/ref_annot.gtf
gnomAD_db: /../ref/gnomAD_v4.1
RNA_editing: /../ref/AllEditingSites.hg38.txt.gz
PoN_SR: /../ref/PoN.scRNAseq.hg38.tsv.gz

# Change any of those to True if you want to run it, else False
Run:
# Create a PoN based on Normals
PoN: False
# Run cell type reannotation
reanno: True
CellTypeReannotation: True
# Run SNV calling with SComatic
scomatic: True
# Run SNV annotation with annovar
annovar: False
SNVCalling: True
# Run cell clustering with BnpC
bnpc: True
CellClustering: True
# Run fusion calling with CTAT-LR-Fusion
ctatfusion: True
FusionCalling: True
# Run CNV calling with InferCNV
infercnv: False
# Generate various plots
plot: False
# Run scDNA validation (DEV only)
scdna: False

Global:
outdir: /cluster/work/bewi/members/dondia/projects/long_reads_tree/LongSom_out/OvCa_LR
data: /cluster/work/bewi/members/dondia/projects/long_reads_tree/data/SComatic_input/OvCa_LR
qc: /cluster/work/bewi/members/dondia/projects/long_reads_tree/bin/LongSom/QC/scripts
scomatic: /cluster/work/bewi/members/dondia/projects/long_reads_tree/bin/LongSom/SComatic/scripts
bnpc: /cluster/work/bewi/members/dondia/projects/long_reads_tree/bin/LongSom/BnpC
annovar: /cluster/work/bewi/members/dondia/projects/long_reads_tree/bin/annovar
subread: /cluster/work/bewi/members/dondia/projects/long_reads_tree/bin/subread-2.0.6-source
infercnv: /cluster/work/bewi/members/dondia/projects/long_reads_tree/bin/LongSom/InferCNV
genome: /cluster/work/bewi/members/dondia/projects/ovarian_cancer/reference/hg38.fa
isoforms: /cluster/work/bewi/members/dondia/projects/ovarian_cancer/reference/gencode.v36.annotation.gtf
ids:
B486: ""
B497: ""
B500: ""
CNACalling: False

PoN:
celltypes:
Normal: ""
ids:
B486_Norm: ""
B500_Norm: ""
min_ac_cells: 1
min_ac_reads: 1
min_cells: 1
min_cell_types: 1

CellTypeReannotation:
cancer_ctype: HGSOC
noncancer_ctype: Non-HGSOC
ctypes: ['HGSOC', 'Non-HGSOC']
celltypes:
HGSOC: ""
Non-HGSOC: ""
ctype_column: Automated_Cell_type
chrM_contaminant: 'False'
### Cell Type Reannotation
Reanno:

BaseCellCounter:
min_mapping_quality: 60
chromosomes: all

BaseCellCalling:
Min_cell_types: 2
min_distance: 0
max_gnomAD_VAF: 0.01
min_ac_cells: 5
min_ac_reads: 20
alpha1: 0.21356677091082193
beta1: 104.95163748636298
alpha2: 0.2474528917555431
beta2: 162.03696139428595

HCCV:
min_depth: 20
deltaVAF: 0.25
deltaCCF: 0.4
min_depth: 50
deltaVAF: 0.2
deltaMCF: 0.25
clust_dist: 10000
chrM_contaminant: 'False'
alt_flag: All
pvalue: 0.01

Reannotation:
min_variants: 3
min_fraction: 0.25

### SNV Calling
SNVCalling:
cancer_ctype: Cancer
celltypes:
Cancer: ""
NonCancer: ""
min_ac_reads: 3
min_ac_cells: 2
clust_dist: 10000
clustermap:
height: 10
width: 15

scDNA:
Tumor_clone: 'Clone_Tum'
NonTumor_clone: 'Clone_NonTum'
BaseCellCounter:
min_mapping_quality: 30
min_dp: 5
min_cc: 1
BaseCellCalling:
min_ac_cells: 2
min_ac_reads: 3

scDNAValidation:
min_depth: 17

SComatic:
chrM_contaminant: 'True'

BaseCellCounter:
min_mapping_quality: 60
chromosomes: all
chromosomes: all

BaseCellCalling:
Min_cell_types: 2
RNA_editing: /cluster/work/bewi/members/dondia/projects/long_reads_tree/bin/SComatic/RNAediting/AllEditingSites.hg38.txt
min_distance: 0
PoN_SR: /cluster/work/bewi/members/dondia/projects/long_reads_tree/bin/SComatic/PoNs/PoN.scRNAseq.hg38.tsv
gnomAD_db: /cluster/work/bewi/members/dondia/projects/long_reads_tree/ref/gnomAD_v4.1
max_gnomAD_VAF: 0.01
deltaVAF: 0.1
deltaCCF: 0.3
min_ac_cells: 1
min_ac_reads: 1
deltaMCF: 0.3
min_ac_reads: 3
min_ac_cells: 2
clust_dist: 10000
chrM_contaminant: 'True'
alpha1: 0.21356677091082193
beta1: 104.95163748636298
alpha2: 0.2474528917555431
beta2: 162.03696139428595

### Fusion Calling
FusionCalling:
SomaticFusions:
min_ac_reads: 3
min_ac_cells: 2
max_MCF_noncancer: 0.1
deltaMCF: 0.3

### Cell Clustering
CellClust:

SingleCellGenotype:
alt_flag: All
pvalue: 0.01

BnpC:
outdir: '3kSteps.0.001-5dpa'
min_cells_per_mut: 5
min_pos_cov: 3
mcmc_steps: 1000
cup: 0
eup: 0
FP: -1
FN: -1
estimator: 'posterior'
pp: [1,1]
dpa:
B486: [0.001,5]
B497: [1,1]
B500: [1,1]
mut_order:
B486: '' #/cluster/work/bewi/members/dondia/projects/long_reads_tree/LongSom_out/OvCa_LR/BnpC/BnpC_input/B486.order.tsv'
B497: ''
B500: ''

FormatInput:
min_cells_per_mut: 5
min_pos_cov: 3

BnpC:
mcmc_steps: 1000
cup: 0
eup: 0
FP: -1
FN: -1
estimator: 'posterior'
pp: [1,1]
dpa: [1,1]

### CNA Calling
inferCNV:
ordering: /cluster/work/bewi/members/dondia/projects/long_reads_tree/bin/LongSom/InferCNV/gene_ordering_file.txt
ordering: ../scripts/CNACalling/gene_ordering_file.txt
18 changes: 5 additions & 13 deletions profile/config.yaml
Original file line number Diff line number Diff line change
@@ -1,19 +1,11 @@

executor: slurm
latency-wait: 60
latency-wait: 30
jobs: 500
cores: 100
cores: 500

default-resources:
cpus_per_task: 8
mem_mb_per_cpu: 1024
mem_mb_per_cpu: max(2*input.size_mb, 4096)
runtime: 240
slurm_account: "'es_beere'"
tmpdir: "'/scratch'"
time: 1200
runtime: 1200

set-threads:
BaseCellCounter_scDNACalling: 64
set-resources:
BaseCellCounter_scDNACalling:
cpus_per_task: 64
#tmpdir: /cluster/scratch/
2 changes: 2 additions & 0 deletions ref/.gitignore
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
GRCh38_gencode_v44_CTAT_lib_Oct292023.plug-n-play
gnomAD_v4.1
File renamed without changes.
File renamed without changes.
15 changes: 15 additions & 0 deletions run_LongSom.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
#!/usr/bin/env bash
OUTPUT_DIR=/path/to/output_dir
REF_DIR=path/to/LongSom/ref/GRCh38_gencode_v44_CTAT_lib_Oct292023.plug-n-play/ctat_genome_lib_build_dir

snakemake \
-s workflow/LongSom.smk \
--configfile config/config.yaml \
--use-conda \
--use-singularity \
--singularity-args "-B ${OUTPUT_DIR}:/output -B /tmp:/tmp -B ${REF_DIR}:/ref" \
--show-failed-logs \
--rerun-incomplete \
-p \


22 changes: 22 additions & 0 deletions run_LongSom_slurm.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,22 @@
#!/usr/bin/env bash
OUTPUT_DIR=/path/to/output_dir
REF_DIR=REF_DIR=path/to/LongSom/ref/GRCh38_gencode_v44_CTAT_lib_Oct292023.plug-n-play/ctat_genome_lib_build_dir

mkdir -p logs
mkdir -p ${OUTPUT_DIR}
sbatch \
--time=20:00:00 \
-o logs/snakelog.out \
-e logs/snakelog.err \
snakemake \
-s workflow/Snakefile \
--configfile workflow/test.yaml \
--profile profile/ \
--use-conda \
--use-singularity \
--singularity-args "-B ${OUTPUT_DIR}:/output -B /tmp:/tmp -B ${REF_DIR}:/ref" \
--show-failed-logs \
--rerun-incomplete \
-p \
"$@"

18 changes: 0 additions & 18 deletions run_SComatic.sh

This file was deleted.

Loading

0 comments on commit 9a259ff

Please sign in to comment.