self.dataset = []
- self.read_size = Conf.read_size
+ self.read_size = 38
+ #self.prb_offset = 50
+ self.prb_offset = 64
self.half_window_size = 1500
assert not os.path.exists(dataset_fn), 'The data_file already exists!'
assert not os.path.exists(dataset_keys_fn), 'The data_keys file already exists!'
+ #pdb.set_trace()
# saving new dataset and single keys as well
cPickle.dump(self.dataset,open(dataset_fn,'w+'),protocol=2)
cPickle.dump(self.dataset.keys(),open(dataset_keys_fn,'w+'),protocol=2)
# In order to save some space we use a signed char to store the
# qualities. Each quality element can range as follows: -128 <= elem <= 127
- prb = array.array('b',map(lambda x: ord(x)-64,slist[5]))
+
+ prb = array.array('b',map(lambda x: ord(x)-self.prb_offset,slist[5]))
# add instance to set
currentSeqInfo = (id,chromo,strand,genomicSeq_start,genomicSeq_stop)