2 # -*- coding: utf-8 -*-
6 def paths_load_data_pickle(expt
,genome_info
,PAR
):
11 # function [Sequences, Acceptors, Donors, Exons, Ests, Noises] = paths_load_data(expt,genome_info,PAR)
12 # Load the relevant file and return the alignment data
14 # expt can be 'training','validation' or 'test'
16 assert expt
in ['training','validation','test']
18 tmp_dir
= '/fml/ag-raetsch/home/fabio/tmp'
22 if expt
== 'training':
24 if PAR
.LOCAL_ALIGN
: # local version
26 train_data
= '%s/microexon_train_data.pickle' % genome_info
.basedir
27 data
= cPickle
.load(open(train_data
))
29 else: # global version
34 train_data
= '%s/exons_train_local.pickle' % genome_info
.basedir
35 data
= cPickle
.load(open(train_data
))
37 print 'train_data is %s' % train_data
39 Sequences
= data
['Train'] # dna sequences
40 Acceptors
= data
['TrainAcc'] # acceptor scores
41 Donors
= data
['TrainDon'] # donor scores
42 Exons
= data
['TrainExon'] # exon boundaries
43 Ests
= data
['TrainEsts'] # est sequences
45 # Lower all indices by one to convert matlab
50 return Sequences
, Acceptors
, Donors
, Exons
, Ests
, Noises