Open AzamatB opened 4 years ago
Results for the small neural network with the following dimensions:
encoder_dims = (
blstm = (in = (length ∘ first ∘ first)(Xs), out = 64),
pblstms_out = (64, 64, 64)
)
attention_dim = 64
decoder_out_dims = (128, 64)
m = LAS(encoder_dims, attention_dim, decoder_out_dims, out_dim)
For `xs = last(Xs_train); Xs = vecofmats2tensor(xs)`:
julia> reset!(m); Hs′ = permutedims(Hs, [1,2,3]);
julia> @benchmark fdtb($m, $Hs′, $ψhs)
BenchmarkTools.Trial:
memory estimate: 2.32 GiB
allocs estimate: 237186
--------------
minimum time: 2.056 s (10.21% GC)
median time: 2.061 s (11.02% GC)
mean time: 2.076 s (10.89% GC)
maximum time: 2.110 s (11.43% GC)
--------------
samples: 3
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [1,3,2]);
julia> @benchmark fdbt($m, $Hs′, $ψhs)
BenchmarkTools.Trial:
memory estimate: 2.32 GiB
allocs estimate: 248585
--------------
minimum time: 2.211 s (9.53% GC)
median time: 2.217 s (9.76% GC)
mean time: 2.255 s (9.85% GC)
maximum time: 2.338 s (10.24% GC)
--------------
samples: 3
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [2,1,3]);
julia> @benchmark ftdb($m, $Hs′, $ψhs)
BenchmarkTools.Trial:
memory estimate: 2.32 GiB
allocs estimate: 229585
--------------
minimum time: 2.280 s (10.04% GC)
median time: 2.319 s (10.19% GC)
mean time: 2.313 s (10.30% GC)
maximum time: 2.339 s (10.65% GC)
--------------
samples: 3
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [3,2,1]);
julia> @benchmark fbtd($m, $Hs′, $ψhs)
BenchmarkTools.Trial:
memory estimate: 2.33 GiB
allocs estimate: 249345
--------------
minimum time: 2.295 s (9.64% GC)
median time: 2.328 s (10.05% GC)
mean time: 2.319 s (10.03% GC)
maximum time: 2.334 s (10.02% GC)
--------------
samples: 3
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [2,3,1]);
julia> @benchmark ftbd($m, $Hs′, $ψhs)
BenchmarkTools.Trial:
memory estimate: 2.33 GiB
allocs estimate: 228825
--------------
minimum time: 2.227 s (10.22% GC)
median time: 2.243 s (10.14% GC)
mean time: 2.331 s (9.88% GC)
maximum time: 2.523 s (9.48% GC)
--------------
samples: 3
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [1,2,3]);
julia> @benchmark gfdtb($m, $Hs′, $ψhs, $θ)
BenchmarkTools.Trial:
memory estimate: 13.72 GiB
allocs estimate: 2049836
--------------
minimum time: 20.062 s (58.75% GC)
median time: 20.062 s (58.75% GC)
mean time: 20.062 s (58.75% GC)
maximum time: 20.062 s (58.75% GC)
--------------
samples: 1
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [1,3,2]);
julia> @benchmark gfdbt($m, $Hs′, $ψhs, $θ)
BenchmarkTools.Trial:
memory estimate: 13.72 GiB
allocs estimate: 2077195
--------------
minimum time: 19.861 s (58.31% GC)
median time: 19.861 s (58.31% GC)
mean time: 19.861 s (58.31% GC)
maximum time: 19.861 s (58.31% GC)
--------------
samples: 1
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [2,1,3]);
julia> @benchmark gftdb($m, $Hs′, $ψhs, $θ)
BenchmarkTools.Trial:
memory estimate: 13.72 GiB
allocs estimate: 2042235
--------------
minimum time: 20.234 s (57.38% GC)
median time: 20.234 s (57.38% GC)
mean time: 20.234 s (57.38% GC)
maximum time: 20.234 s (57.38% GC)
--------------
samples: 1
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [3,2,1]);
julia> @benchmark gfbtd($m, $Hs′, $ψhs, $θ)
BenchmarkTools.Trial:
memory estimate: 13.75 GiB
allocs estimate: 2074915
--------------
minimum time: 20.462 s (57.27% GC)
median time: 20.462 s (57.27% GC)
mean time: 20.462 s (57.27% GC)
maximum time: 20.462 s (57.27% GC)
--------------
samples: 1
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [2,3,1]);
julia> @benchmark gftbd($m, $Hs′, $ψhs, $θ)
BenchmarkTools.Trial:
memory estimate: 13.75 GiB
allocs estimate: 2038435
--------------
minimum time: 20.262 s (57.72% GC)
median time: 20.262 s (57.72% GC)
mean time: 20.262 s (57.72% GC)
maximum time: 20.262 s (57.72% GC)
--------------
samples: 1
evals/sample: 1
For `xs = first(Xs_train); Xs = vecofmats2tensor(xs)`:
julia> reset!(m); Hs′ = permutedims(Hs, [1,2,3]);
julia> @benchmark fdtb($m, $Hs′, $ψhs)
BenchmarkTools.Trial:
memory estimate: 1.15 GiB
allocs estimate: 33844
--------------
minimum time: 1.339 s (7.84% GC)
median time: 1.364 s (8.91% GC)
mean time: 1.360 s (8.79% GC)
maximum time: 1.371 s (8.49% GC)
--------------
samples: 4
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [1,3,2]);
julia> @benchmark fdbt($m, $Hs′, $ψhs)
BenchmarkTools.Trial:
memory estimate: 1.15 GiB
allocs estimate: 36363
--------------
minimum time: 1.339 s (7.94% GC)
median time: 1.373 s (9.06% GC)
mean time: 1.369 s (8.90% GC)
maximum time: 1.391 s (8.63% GC)
--------------
samples: 4
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [2,1,3]);
julia> @benchmark ftdb($m, $Hs′, $ψhs)
BenchmarkTools.Trial:
memory estimate: 1.15 GiB
allocs estimate: 32163
--------------
minimum time: 1.471 s (7.80% GC)
median time: 1.482 s (8.55% GC)
mean time: 1.489 s (8.60% GC)
maximum time: 1.524 s (9.47% GC)
--------------
samples: 4
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [3,2,1]);
julia> @benchmark fbtd($m, $Hs′, $ψhs)
BenchmarkTools.Trial:
memory estimate: 1.16 GiB
allocs estimate: 36531
--------------
minimum time: 1.371 s (8.18% GC)
median time: 1.417 s (9.05% GC)
mean time: 1.412 s (9.05% GC)
maximum time: 1.444 s (9.88% GC)
--------------
samples: 4
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [2,3,1]);
julia> @benchmark ftbd($m, $Hs′, $ψhs)
BenchmarkTools.Trial:
memory estimate: 1.16 GiB
allocs estimate: 31995
--------------
minimum time: 1.420 s (7.78% GC)
median time: 1.455 s (8.21% GC)
mean time: 1.448 s (8.38% GC)
maximum time: 1.461 s (8.31% GC)
--------------
samples: 4
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [1,2,3]);
julia> @benchmark gfdtb($m, $Hs′, $ψhs, $θ)
BenchmarkTools.Trial:
memory estimate: 4.39 GiB
allocs estimate: 280749
--------------
minimum time: 4.613 s (17.69% GC)
median time: 4.658 s (18.04% GC)
mean time: 4.658 s (18.04% GC)
maximum time: 4.702 s (18.38% GC)
--------------
samples: 2
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [1,3,2]);
julia> @benchmark gfdbt($m, $Hs′, $ψhs, $θ)
BenchmarkTools.Trial:
memory estimate: 4.39 GiB
allocs estimate: 286796
--------------
minimum time: 4.632 s (17.63% GC)
median time: 4.668 s (18.03% GC)
mean time: 4.668 s (18.03% GC)
maximum time: 4.704 s (18.43% GC)
--------------
samples: 2
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [2,1,3]);
julia> @benchmark gftdb($m, $Hs′, $ψhs, $θ)
BenchmarkTools.Trial:
memory estimate: 4.39 GiB
allocs estimate: 279068
--------------
minimum time: 4.798 s (15.06% GC)
median time: 4.959 s (17.10% GC)
mean time: 4.959 s (17.10% GC)
maximum time: 5.120 s (19.01% GC)
--------------
samples: 2
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [3,2,1]);
julia> @benchmark gfbtd($m, $Hs′, $ψhs, $θ)
BenchmarkTools.Trial:
memory estimate: 4.41 GiB
allocs estimate: 286292
--------------
minimum time: 4.584 s (15.84% GC)
median time: 4.705 s (18.05% GC)
mean time: 4.705 s (18.05% GC)
maximum time: 4.827 s (20.14% GC)
--------------
samples: 2
evals/sample: 1
julia> reset!(m); Hs′ = permutedims(Hs, [2,3,1]);
julia> @benchmark gftbd($m, $Hs′, $ψhs, $θ)
BenchmarkTools.Trial:
memory estimate: 4.41 GiB
allocs estimate: 278228
--------------
minimum time: 4.809 s (15.06% GC)
median time: 4.969 s (17.10% GC)
mean time: 4.969 s (17.10% GC)
maximum time: 5.129 s (19.02% GC)
--------------
samples: 2
evals/sample: 1
Benchmarking results are