print'Other time since import %.3fs %.1f%%'%(other_time,other_time/total_time*100)
print'%i Theano fct call, %.3fs per call'%(total_fct_call,time_per_call)
print'Other time since import %.3fs %.1f%%'%(other_time,other_time/total_time*100)
print'%i Theano fct call, %.3fs per call'%(total_fct_call,time_per_call)
print
print"List of apply that don't have float64 as input but have float64 in outputs. Usefull to know if we forgot some cast when using floatX=float32 or gpu code."
...
...
@@ -1236,7 +1244,7 @@ if 0: # old code still to be ported from ProfileMode
scalar_op_amdlibm_speed_up=[scal.Mod,scal.Pow,scal.Ceil,scal.Floor,scal.RoundHalfToEven,scal.RoundHalfAwayFromZero,scal.Log,scal.Log2,scal.Log10,scal.Log1p,scal.Exp,scal.Sqrt,scal.Abs,scal.Cos,scal.Sin,scal.Tan,scal.Tanh,scal.Cosh,scal.Sinh,T.nnet.sigm.ScalarSigmoid,T.nnet.sigm.ScalarSoftplus]#Abs, Mod in float{32,64} only
scal.Sqrt,scal.Abs,scal.Cos,scal.Sin,scal.Tan,scal.Tanh,scal.Cosh,scal.Sinh,T.nnet.sigm.ScalarSigmoid,T.nnet.sigm.ScalarSoftplus]# Abs, Mod in float{32,64} only
print" - With the default gcc libm, exp in float32 is slower than in float64! Try Theano flags floatX=float64 or install amdlibm and set the theano flags lib.amdlibm=True"