In [1]:
from __future__ import print_function
import keras
from keras.models import Sequential, Model, load_model
from keras import backend as K
import tensorflow as tf
import isolearn.keras as iso
import os
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import matplotlib.cm as cm
from keras.utils import plot_model


from aparent.predictor import *
##################################################
#import bioPython for working with FASTA files
from Bio import SeqIO
##################################################


# Load the trained APARENT network from disk and write a diagram of its
# layers (including tensor shapes) to APARENTmodel.png.
aparent_model = load_model(
    './saved_models/aparent_large_lessdropout_all_libs_no_sampleweights.h5'
)
plot_model(aparent_model, to_file='APARENTmodel.png', show_shapes=True)
# Encoder used to turn sequences into model input.
# NOTE(review): get_aparent_encoder is presumably supplied by the
# `from aparent.predictor import *` star import; the meaning of lib_bias=4
# is not visible in this notebook — confirm against the aparent package.
aparent_encoder = get_aparent_encoder(lib_bias=4)

# Where the input FASTA files live, which contigs to process, and where the
# prediction arrays are written.
fastaDestination = "./fastas/"
fastaNames = ["KI270418.1", "KI270587.1"]
predDestination = "./PredictionBinaries/"
# Strides to sweep: 1..15 in steps of 1, then 20..50 in steps of 5.
strideSizes = list(range(1, 16)) + list(range(20, 51, 5))

# Run the predictor over every contig at every stride size and save the
# second return value of each run as a .npy file under
#   <predDestination>/<name>Predictions/<name with "." -> "_">_cutPredsStrideLen<stride>.npy
for name in fastaNames:
    # SeqIO.read expects exactly one record in the FASTA file.
    contigSeq = SeqIO.read(fastaDestination + name + ".fasta", "fasta")
    seq = contigSeq.seq #actual genomic sequence from the file
    print ("PREDICTING ", contigSeq.id, " with length ", len(seq))

    # Per-contig values that do not depend on the stride, computed once.
    repPeriod = name.replace(".", "_")
    outDir = os.path.join(predDestination, name + "Predictions")
    # np.save does not create missing directories; make sure the target
    # exists so a fresh checkout does not fail on the first save.
    if not os.path.isdir(outDir):
        os.makedirs(outDir)

    for stride in strideSizes:
        print ("Stride length is: ", stride)
        # NOTE(review): x is not used in this cell; y is what gets saved
        # (presumably the per-position cut predictions, judging by the
        # output filename — confirm against aparent.predictor).
        x,y = find_polya_peaks_memoryFriendly(
            aparent_model,
            aparent_encoder,
            seq,
            sequence_stride=stride,
            conv_smoothing=False,
            peak_min_height=0.01,
            peak_min_distance=50,
            peak_prominence=(0.01, None),
        )
        # np.save appends the ".npy" extension itself.
        np.save(
            os.path.join(outDir, repPeriod + "_cutPredsStrideLen" + str(stride)),
            y,
        )
    print ("FINISHED")



Using TensorFlow backend.
  _np_qint8 = np.dtype([("qint8", np.int8, 1)])
  _np_quint8 = np.dtype([("quint8", np.uint8, 1)])
  _np_qint16 = np.dtype([("qint16", np.int16, 1)])
  _np_quint16 = np.dtype([("quint16", np.uint16, 1)])
  _np_qint32 = np.dtype([("qint32", np.int32, 1)])
  np_resource = np.dtype([("resource", np.ubyte, 1)])
  _np_qint8 = np.dtype([("qint8", np.int8, 1)])
  _np_quint8 = np.dtype([("quint8", np.uint8, 1)])
  _np_qint16 = np.dtype([("qint16", np.int16, 1)])
  _np_quint16 = np.dtype([("quint16", np.uint16, 1)])
  _np_qint32 = np.dtype([("qint32", np.int32, 1)])
  np_resource = np.dtype([("resource", np.ubyte, 1)])







PREDICTING  KI270418.1  with length  2145
Stride length is:  1

Stride length is:  2
Stride length is:  3
Stride length is:  4
Stride length is:  5
Stride length is:  6
Stride length is:  7
Stride length is:  8
Stride length is:  9
Stride length is:  10
Stride length is:  11
Stride length is:  12
Stride length is:  13
Stride length is:  14
Stride length is:  15
Stride length is:  20
Stride length is:  25
Stride length is:  30
Stride length is:  35
Stride length is:  40
Stride length is:  45
Stride length is:  50
FINISHED
PREDICTING  KI270587.1  with length  2969
Stride length is:  1
Stride length is:  2
Stride length is:  3
Stride length is:  4
Stride length is:  5
Stride length is:  6
Stride length is:  7
Stride length is:  8
Stride length is:  9
Stride length is:  10
Stride length is:  11
Stride length is:  12
Stride length is:  13
Stride length is:  14
Stride length is:  15
Stride length is:  20
Stride length is:  25
Stride length is:  30
Stride length is:  35
Stride length is:  40
