Commit 523b941b authored by Chris Cheshire's avatar Chris Cheshire
Browse files

Added explicit dask data type resolution

parent 30d47964
Loading
Loading
Loading
Loading
+2 −2
Original line number Diff line number Diff line
@@ -35,7 +35,7 @@ peak_perc = 0
print('Reading file')

# Read file in using dask
ddf_inter = dd.read_csv(args.intersect, sep='\t', header=None, names=['chrom','start','end','overlap_1','key','a_name','b_name','count'])
ddf_inter = dd.read_csv(args.intersect, sep='\t', header=None, names=['chrom','start','end','overlap_1','key','a_name','b_name','count'], dtype={'overlap_1': 'float64'})

# Find number of files
numfiles = ddf_inter['b_name'].max().compute()
@@ -44,7 +44,7 @@ numfiles = ddf_inter['b_name'].max().compute()
if isinstance(numfiles, str):
    print('Detected single file, reloading table')
    numfiles = 1
    ddf_inter = dd.read_csv(args.intersect, sep='\t', header=None, names=['chrom','start','end','overlap_1','overlap_2','key','name','count'])
    ddf_inter = dd.read_csv(args.intersect, sep='\t', header=None, names=['chrom','start','end','overlap_1','overlap_2','key','name','count'], dtype={'overlap_1': 'float64', 'overlap_2': 'float64'})

print('Number of files: ' + str(numfiles))