# PlinkSnakefile
"""Redfish data filtering and conversion to Plink format
Input:
vcf : a variant call format file defined in the config file. Default is `qual_filtered_redfishamplicon_calls.vcf`
Returns:
ped/map: a filtered ped and map file pair in plink format for use with subsequent data analysis.
"""
# Workflow configuration; the rules in this file read config["vcf"] and
# config["plink"] from it.
configfile: "config.json" # this file is generated with `python redfish_snake_setup.py`
rule all:
input:
config["plink"] + ".ped",
config["plink"] + ".map"
rule plink_filter:
"""
Convert vcf to plink format.
Produce BED/BIM output pair for subsequent use.
"""
input:
vcf=config["vcf"]
output:
bim=config["plink"] + ".bed",
bam=config["plink"] + ".bim",
fam=config["plink"] + ".fam"
params:
plink_filename = config["plink"]
log:
"logs/bwa_mem/plink_process.log"
threads: 24
shell:
"plink --vcf {input.vcf} --allow-extra-chr --make-bed "
"--double-id --maf 0.01 --geno 0.05 --mind 0.2 "
"--out {params.plink_filename}"
rule plink_recode:
"""
Recode as a PED/MAP pair
"""
input:
bim=config["plink"] + ".bed",
bam=config["plink"] + ".bim",
fam=config["plink"] + ".fam"
output:
ped=config["plink"] + ".ped",
map=config["plink"] + ".map",
params:
plink_filename = config["plink"]
log:
"logs/bwa_mem/plink_recode.log"
threads: 24
shell:
"plink --bfile {params.plink_filename} "
" --recode --tab --allow-extra-chr --out {params.plink_filename} "