Skip to content

Commit

Permalink
update
Browse files Browse the repository at this point in the history
  • Loading branch information
Zhuoqing Fang committed Sep 24, 2017
1 parent befd6f7 commit 468df06
Show file tree
Hide file tree
Showing 3 changed files with 41 additions and 29 deletions.
54 changes: 27 additions & 27 deletions config.yml
Original file line number Diff line number Diff line change
Expand Up @@ -2,19 +2,19 @@
# 2017-03-28

# dir contains all indexes, genome sequences
genome: "/Users/bioninja/genome"
genome: "/Users/bioninja/genome/Human_GRCh38"
# Path to an uncompressed FASTA file with all choromsome genome sequences.
# we use gencode archive, downlaod from here:
# we use gencode archive, downlaod from here:
# http://www.gencodegenes.org/releases/current.html
fasta: "/Users/bioninja/genome/Human_GRCh38/GRCh38.p10.genome.fa"

# Path to an uncompressed FASTA file with all transcript sequences.
# we use gencode archive, downlaod from here:
# we use gencode archive, downlaod from here:
# http://www.gencodegenes.org/releases/current.html
cdna: "/Users/bioninja/genome/Human_GRCh38/gencode.v26.transcripts.fa"

# GTF file path
# we use gencode archive, downlaod from here:
# we use gencode archive, downlaod from here:
# http://www.gencodegenes.org/releases/current.html
gtf: "/Users/bioninja/genome/Human_GRCh38/gencode.v26.annotation.gtf"

Expand All @@ -26,18 +26,18 @@ salmon_index: "/Users/bioninja/genome/Human_GRCh38/salmonIndices_hg38"
index_prefix: "hg38"

# Full path to a folder where output files will be created.
workdir: "/Users/bioninja/public-seq/H170013-P001/"
workdir: "/Volumes/G-DRIVE/DBRL/fzq/"

# extra scripts' dir for running. e.g preDEseq.py (StringTie)
scripts: "/Users/bioninja/public-seq/H170013-P001/snakeflow/scripts"
scripts: "/Volumes/G-DRIVE/DBRL/fzq/snakeflow/scripts"

# Full path to a folder that holds all of your FASTQ files
fastq_dir: "/Users/bioninja/public-seq/H170013-P001/fastq_clean"
fastq_dir: "/Volumes/G-DRIVE/DBRL/fzq/fastq_clean"



# Sequencing read length, only reqired for running rMATS or preDEseq.py.
read_length: 150
read_length: 50

# Paired end sequencing library? True or False.
paired: True
Expand All @@ -50,49 +50,49 @@ stranded: False
# information in `samples` is used for deseq2 and rMATS
samples:
# fastq files prefix, seperate each sample by space
name: "WGC096874R WGC096875R WGC096876R WGC096877R" # keep order for each sample
name: "WGC74R WGC75R WGC76R WGC77R" # keep order for each sample
# short names for sample names
alias: "S74 S75 S76 S77" # optional

#Any lable name to indicate sample's group/condition where they belong to.
#keep the same order with `name`
group: "Normal Control Normal Control"
#keep the same order with `name`
group: "Normal Control Normal Control"
# optional, if your data is not time-series, ignore `time` attr.
time: "0 0 0 0"
time: "0 0 0 0"

# ``dataframe``attribute works only if a file is given.
# each column names correspond to the samples' attributes of above.
coldata: "/Users/bioninja/public-seq/H170013-P001/sample_info_single.txt" #
coldata: "/Volumes/G-DRIVE/DBRL/fzq/sample_info_single.txt" #

# a sampleTable.txt look like this.
### name alias conditon treatment
## WGC096874R S74 Normal 0
## WGC096875R S75 Cancer 0
## WGC096876R S76 Normal 0
## WGC096877R S77 Cancer 0
enrichr_library: ['GO_Cellular_Component_2015','GO_Molecular_Function_2015',
'GO_Biological_Process_2015','Human_Phenotype_Ontology',
## WGC096877R S77 Cancer 0
enrichr_library: ['GO_Cellular_Component_2017b','GO_Molecular_Function_2017b',
'GO_Biological_Process_2017b','Human_Phenotype_Ontology',
'MSigDB_Oncogenic_Signatures','WikiPathways_2016',
'KEGG_2016']

# RNA Binding Protein list
rbps: "/Users/bioninja/public-seq/H170013-P001/snakeflow/221RBPs.csv"
# RNA Binding Protein list
rbps: "/Volumes/G-DRIVE/DBRL/fzq/snakeflow/221RBPs.csv"
# Before running with your samples,
# please rename all your samples with the same suffix below.
# for example, rename all your sample like this: "WGC096874R_combined_R1.fastq.gz"
# for trimed fastq, use suffix like: _trimmed.fq.gz
read_pattern:
r1: "{sample}_R1_val_1.fq.gz" # don't change {sample}
r2: "{sample}_R2_val_2.fq.gz" # don't change {sample}
fastqc: "qc/fastqc/{sample}_R1_val_1_fastqc.{suf}"
read_pattern:
r1: "{sample}_1.fq.gz" # don't change {sample}
r2: "{sample}_2.fq.gz" # don't change {sample}
fastqc: "qc/fastqc/{sample}_1_fastqc.{suf}"

# RSeQC bed file
# this two files are optional, if you do not need to run RSeQC.
# Download from https://sourceforge.net/projects/rseqc/files/BED/Human_Homo_sapiens/
rseqc:
rseqc:
refseq: "/Users/bioninja/genome/rseqc_ann/hg38_RefSeq.bed"
housekeep: "/Users/bioninja/genome/rseqc_ann/hg38.HouseKeepingGenes.bed"

#trimmonatic adaptors
#trimmonatic adaptors
adaptors:
illumina: "/Users/bioninja/github/snakeflow/adaptors/TruSeq3-PE.fa"
illumina: "/Users/bioninja/github/snakeflow/adaptors/TruSeq3-PE.fa"
14 changes: 13 additions & 1 deletion example/sample_info_single.txt
Original file line number Diff line number Diff line change
@@ -1 +1,13 @@
#file alias condition treatmentS526_09B_CHG022991-GATCAG_L005 R1 DMSO 0S526_09B_CHG022992-TAGCTT_L005 R2 DMSO 0S526_09B_CHG022993-GGCTAC_L005 R3 DMSO 0S526_09B_CHG022994-CTTGTA_L005 RA1 RA 0S526_02A_CHG022995-ATCACG_L001 RA2 RA 0S526_02A_CHG022996-CGATGT_L001 RA3 RA 0S526_02A_CHG022997-TTAGGC_L001 RK1 RK 0S526_02A_CHG022998-TGACCA_L001 RK2 RK 0S526_02A_CHG022999-ACAGTG_L001 RK3 RK 0S526_02A_CHG023000-GCCAAT_L001 RKA1 RKA 0S526_02A_CHG023001-CAGATC_L001 RKA2 RKA 0S526_02A_CHG023002-ACTTGA_L001 RKA3 RKA 0
#file alias condition treatment
WT_D0_A WTD0A WT0 0
WT_D0_B WTD0B WT0 0
WT_D2_A WTD2A WT2 0
WT_D2_B WTD2B WT2 0
WT_D3_A WTD3A WT3 0
WT_D3_B WTD3B WT3 0
S13_D0_A S13D0A KO0 0
S13_D0_B S13D0B KO0 0
S13_D2_A S13D2A KO2 0
S13_D2_B S13D2B KO2 0
S13_D3_A S13D3A KO3 0
S13_D3_B S13D3B KO3 0
2 changes: 1 addition & 1 deletion salmon-tximport-deseq2-v0.2.snakefile
Original file line number Diff line number Diff line change
Expand Up @@ -216,7 +216,7 @@ rule deseq2:
group=" ".join(GROUP),#used for grouping each sample, to dectect degs.
time=" ".join(TIME),
alias=" ".join(SAMPLES_ALIAS)
threads: 4
threads: 8
script:
"scripts/runDESeq2.R"

Expand Down

0 comments on commit 468df06

Please sign in to comment.