Skip to content

Commit 3c40013

Browse files
authored
Merge pull request #92 from jemten/fix_format_column
changing RD to DR in format column
2 parents 71f8ffd + d55186d commit 3c40013

File tree

3 files changed

+25
-25
lines changed

3 files changed

+25
-25
lines changed

setup.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@
2020

2121
setup(
2222
name = 'tiddit',
23-
version = '3.3.0',
23+
version = '3.3.1',
2424

2525
url = "https://github.com/SciLifeLab/TIDDIT",
2626
author = "Jesper Eisfeldt",

tiddit/__main__.py

Lines changed: 11 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@
1717
import tiddit.tiddit_contig_analysis as tiddit_contig_analysis
1818

1919
def main():
20-
version="3.3.0"
20+
version="3.3.1"
2121
parser = argparse.ArgumentParser("""tiddit-{}""".format(version),add_help=False)
2222
parser.add_argument("--sv" , help="call structural variation", required=False, action="store_true")
2323
parser.add_argument("--cov" , help="generate a coverage bed file", required=False, action="store_true")
@@ -88,7 +88,7 @@ def main():
8888
if not os.path.isfile(args.bam):
8989
print ("error, could not find the bam file")
9090
quit()
91-
91+
9292
bam_file_name=args.bam
9393
samfile = pysam.AlignmentFile(bam_file_name, "r",reference_filename=args.ref)
9494

@@ -122,10 +122,10 @@ def main():
122122
print("Folder already exists")
123123

124124
pysam.index("-c","-m","6","-@",str(args.threads),bam_file_name,"{}_tiddit/{}.csi".format(args.o,sample_id))
125-
125+
126126
min_mapq=args.q
127127
max_ins_len=100000
128-
n_reads=args.s
128+
n_reads=args.s
129129

130130
library=tiddit_stats.statistics(bam_file_name,args.ref,min_mapq,max_ins_len,n_reads)
131131
if args.i:
@@ -153,29 +153,29 @@ def main():
153153
print(time.time()-t)
154154

155155
vcf_header=tiddit_vcf_header.main( bam_header,library,sample_id,version )
156-
156+
157157
if not args.e:
158158
args.e=int(library["avg_insert_size"]/2.0)
159-
159+
160160
t=time.time()
161161
sv_clusters=tiddit_cluster.main(prefix,contigs,contig_length,samples,library["mp"],args.e,args.l,max_ins_len,args.min_contig,args.skip_assembly)
162-
162+
163163
print("generated clusters in")
164164
print(time.time()-t)
165-
165+
166166
f=open(prefix+".vcf","w")
167167
f.write(vcf_header+"\n")
168-
168+
169169
t=time.time()
170170
variants=tiddit_variant.main(bam_file_name,sv_clusters,args,library,min_mapq,samples,coverage_data,contig_number,max_ins_len)
171171
print("analyzed clusters in")
172172
print(time.time()-t)
173-
173+
174174
for chr in contigs:
175175
if not chr in variants:
176176
continue
177177
for variant in sorted(variants[chr], key=lambda x: x[0]):
178-
f.write( "\t".join(variant[1])+"\n" )
178+
f.write( "\t".join(variant[1])+"\n" )
179179
f.close()
180180
quit()
181181

tiddit/tiddit_variant.pyx

Lines changed: 13 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@ def get_region(samfile,str chr,int start,int end,int bp,int min_q,int max_ins, c
2323

2424
q_start=start
2525
q_end=end+max_ins
26-
26+
2727
if q_end > contig_length:
2828
q_end=contig_length
2929

@@ -44,14 +44,14 @@ def get_region(samfile,str chr,int start,int end,int bp,int min_q,int max_ins, c
4444

4545
if not read.mate_is_unmapped:
4646
if read.next_reference_start > end and read_reference_start > end:
47-
continue
47+
continue
4848
else:
4949
if read_reference_start > end:
5050
continue
5151

5252
if read.is_duplicate:
5353
continue
54-
54+
5555
if not (read_reference_start > end):
5656
n_reads+=1
5757
if read.mapq < min_q:
@@ -83,7 +83,7 @@ def get_region(samfile,str chr,int start,int end,int bp,int min_q,int max_ins, c
8383

8484
if read_reference_start < start:
8585
r_start=start
86-
86+
8787
if read_reference_end > end:
8888
r_end=end
8989

@@ -133,7 +133,7 @@ def find_sv_type(chrA,chrB,inverted,non_inverted,args,sample_data,samples,librar
133133
return("DUP:TANDEM",cn)
134134
elif cn < p:
135135
return("DEL",cn)
136-
136+
137137
elif inverted > non_inverted:
138138
return("INV",cn)
139139
else:
@@ -253,7 +253,7 @@ def define_variant(str chrA, str bam_file_name,dict sv_clusters,args,dict librar
253253
s=int(math.floor(posA/50.0))
254254
e=int(math.floor(posB/50.0))+1
255255
sample_data[sample]["covM"]=numpy.average(coverage_data[chrA][s:e] )
256-
256+
257257
inverted=0
258258
non_inverted=0
259259
for i in range(0,len(sv_clusters[chrA][chrB][cluster]["positions_A"]["orientation_discordants"]) ):
@@ -277,12 +277,12 @@ def define_variant(str chrA, str bam_file_name,dict sv_clusters,args,dict librar
277277
svtype,cn=find_sv_type(chrA,chrB,inverted,non_inverted,args,sample_data,samples,library)
278278

279279
filt=sv_filter(sample_data,args,chrA,chrB,posA,posB,max_ins_len,n_discordants,n_splits,library,sample_data[sample]["discA"],sample_data[sample]["discB"],sample_data[sample]["splitA"],sample_data[sample]["splitB"],n_contigs)
280-
format_col="GT:CN:COV:DV:RV:LQ:RR:RD"
280+
format_col="GT:CN:COV:DV:RV:LQ:RR:DR"
281281

282282
#configure filters for CNV based on Read depth
283283
for sample in samples:
284284
if "DEL" in svtype:
285-
#homozygout del based on coverage
285+
#homozygout del based on coverage
286286
if cn == 0:
287287
filt="PASS"
288288

@@ -294,7 +294,7 @@ def define_variant(str chrA, str bam_file_name,dict sv_clusters,args,dict librar
294294
if covA > covM*(cn+0.9) and covB > covM*(cn+0.9):
295295
filt="PASS"
296296

297-
#too few reads, but clear RD signal
297+
#too few reads, but clear DR signal
298298
elif "DUP" in svtype and filt == "BelowExpectedLinks":
299299
filt="PASS"
300300

@@ -361,7 +361,7 @@ def define_variant(str chrA, str bam_file_name,dict sv_clusters,args,dict librar
361361
GT= "1/1"
362362
else:
363363
GT="0/1"
364-
364+
365365
variant.append( "{}:{}:{},{},{}:{}:{}:{},{}:{},{}:{},{}".format(GT,cn,sample_data[sample]["covA"],sample_data[sample]["covM"],sample_data[sample]["covB"],n_discordants,n_splits,sample_data[sample]["QA"],sample_data[sample]["QB"],sample_data[sample]["refRA"],sample_data[sample]["refRB"],sample_data[sample]["refFA"],sample_data[sample]["refFB"]) )
366366
variants.append([chrA,posA,variant])
367367
else:
@@ -472,7 +472,7 @@ def define_variant(str chrA, str bam_file_name,dict sv_clusters,args,dict librar
472472

473473

474474
variant.append( "{}:{}:{},{},{}:{}:{}:{},{}:{},{}:{},{}".format(GT,cn,sample_data[sample]["covA"],sample_data[sample]["covM"],sample_data[sample]["covB"],n_discordants,n_splits,sample_data[sample]["QA"],sample_data[sample]["QB"],sample_data[sample]["refRA"],sample_data[sample]["refRB"],sample_data[sample]["refFA"],sample_data[sample]["refFB"]) )
475-
variants.append([chrB,posB,variant])
475+
variants.append([chrB,posB,variant])
476476

477477
samfile.close()
478478
return(variants)
@@ -481,7 +481,7 @@ def main(str bam_file_name,dict sv_clusters,args,dict library,int min_mapq,sampl
481481
contig_seqs={}
482482
new_seq=False
483483
if not args.skip_assembly:
484-
for line in open("{}_tiddit/clips.fa.assembly.clean.mag".format(args.o)):
484+
for line in open("{}_tiddit/clips.fa.assembly.clean.mag".format(args.o)):
485485

486486
if not new_seq and line[0] == "@" and "\t" in line:
487487
name=line.split("\t")[0][1:]
@@ -501,5 +501,5 @@ def main(str bam_file_name,dict sv_clusters,args,dict library,int min_mapq,sampl
501501
for v in variants_list:
502502
for variant in v:
503503
variants[ variant[0] ].append( [ variant[1],variant[2] ] )
504-
504+
505505
return(variants)

0 commit comments

Comments
 (0)