JuliaGPU / CUDA.jl

CUDA programming in Julia.
https://juliagpu.org/cuda/
Other
1.2k stars 215 forks source link

gemmEx on sm_52 results in CUBLAS_STATUS_ARCH_MISMATCH #609

Closed mkarikom closed 3 years ago

mkarikom commented 3 years ago

Describe the bug

Running `Pkg.test("CUDA")` fails with CUBLAS errors: `gemmEx` on an sm_52 GPU returns `CUBLAS_STATUS_ARCH_MISMATCH`.

To reproduce

```julia
using Pkg
Pkg.add("CUDA")
using CUDA
Pkg.test("CUDA")
```
Manifest.toml

``` # This file is machine-generated - editing it directly is not advised [[AbstractFFTs]] deps = ["LinearAlgebra"] git-tree-sha1 = "051c95d6836228d120f5f4b984dd5aba1624f716" uuid = "621f4979-c628-5d54-868e-fcf4e3e8185c" version = "0.5.0" [[AbstractMCMC]] deps = ["BangBang", "ConsoleProgressMonitor", "Distributed", "Logging", "LoggingExtras", "ProgressLogging", "Random", "StatsBase", "TerminalLoggers", "Transducers"] git-tree-sha1 = "c8988bdf7cb820932be1c8bd59dcbb806279e36f" uuid = "80f14c24-f653-4e6a-9b94-39d6b0f70001" version = "2.2.1" [[AbstractTrees]] deps = ["Markdown"] git-tree-sha1 = "33e450545eaf7699da1a6e755f9ea65f14077a45" uuid = "1520ce14-60c1-5f80-bbc7-55ef81b5835c" version = "0.3.3" [[Adapt]] deps = ["LinearAlgebra"] git-tree-sha1 = "42c42f2221906892ceb765dbcb1a51deeffd86d7" uuid = "79e6a3ab-5dfb-504d-930d-738a2a938a0e" version = "2.3.0" [[ArgCheck]] git-tree-sha1 = "dedbbb2ddb876f899585c4ec4433265e3017215a" uuid = "dce04be8-c92d-5529-be00-80e4d2c0e197" version = "2.1.0" [[Arpack]] deps = ["Arpack_jll", "Libdl", "LinearAlgebra"] git-tree-sha1 = "2ff92b71ba1747c5fdd541f8fc87736d82f40ec9" uuid = "7d9fca2a-8960-54d3-9f78-7d1dccf2cb97" version = "0.4.0" [[Arpack_jll]] deps = ["Libdl", "OpenBLAS_jll", "Pkg"] git-tree-sha1 = "e214a9b9bd1b4e1b4f15b22c0994862b66af7ff7" uuid = "68821587-b530-5797-8361-c406ea357684" version = "3.5.0+3" [[ArrayInterface]] deps = ["LinearAlgebra", "Requires", "SparseArrays"] git-tree-sha1 = "3b5bd474a90bee86b50f26268bbb044bb4d9ef83" uuid = "4fba245c-0d91-5ea0-9b3e-6abc04ee57a9" version = "2.14.9" [[Artifacts]] deps = ["Pkg"] git-tree-sha1 = "c30985d8821e0cd73870b17b0ed0ce6dc44cb744" uuid = "56f22d72-fd6d-98f1-02f0-08ddc0907c33" version = "1.3.0" [[AxisAlgorithms]] deps = ["LinearAlgebra", "Random", "SparseArrays", "WoodburyMatrices"] git-tree-sha1 = "a4d07a1c313392a77042855df46c5f534076fab9" uuid = "13072b0f-2c55-5437-9ae7-d433b7a33950" version = "1.0.0" [[AxisArrays]] deps = ["Dates", "IntervalSets", "IterTools", "RangeArrays"] 
git-tree-sha1 = "f31f50712cbdf40ee8287f0443b57503e34122ef" uuid = "39de3d68-74b9-583c-8d2d-e117c070f3a9" version = "0.4.3" [[BFloat16s]] deps = ["LinearAlgebra", "Test"] git-tree-sha1 = "4af69e205efc343068dc8722b8dfec1ade89254a" uuid = "ab4f0b2a-ad5b-11e8-123f-65d77653426b" version = "0.1.0" [[BangBang]] deps = ["Compat", "ConstructionBase", "Future", "InitialValues", "LinearAlgebra", "Requires", "Setfield", "Tables", "ZygoteRules"] git-tree-sha1 = "f42321255afc37da855b6cd9f2a1fc36c017ceee" uuid = "198e06fe-97b7-11e9-32a5-e1d131e6ad66" version = "0.3.29" [[Base64]] uuid = "2a0f44e3-6c83-55bd-87e4-b1978d98bd5f" [[BenchmarkTools]] deps = ["JSON", "Logging", "Printf", "Statistics", "UUIDs"] git-tree-sha1 = "9e62e66db34540a0c919d72172cc2f642ac71260" uuid = "6e4b80f9-dd63-53aa-95a3-0cdb28fa8baf" version = "0.5.0" [[Bzip2_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "c3598e525718abcc440f69cc6d5f60dda0a1b61e" uuid = "6e34b625-4abd-537c-b88f-471c36dfa7a0" version = "1.0.6+5" [[CEnum]] git-tree-sha1 = "215a9aa4a1f23fbd05b92769fdd62559488d70e9" uuid = "fa961155-64e5-5f13-b03f-caf6b980ea82" version = "0.4.1" [[CUDA]] deps = ["AbstractFFTs", "Adapt", "BFloat16s", "CEnum", "DataStructures", "ExprTools", "GPUArrays", "GPUCompiler", "LLVM", "Libdl", "LinearAlgebra", "Logging", "MacroTools", "NNlib", "Pkg", "Printf", "Random", "Reexport", "Requires", "SparseArrays", "Statistics", "TimerOutputs"] git-tree-sha1 = "7663b61782b569b03fba91d330a5ed2f86cd4cb8" uuid = "052768ef-5323-5732-b1bb-66c8b64840ba" version = "2.3.0" [[Cairo_jll]] deps = ["Artifacts", "Bzip2_jll", "Fontconfig_jll", "FreeType2_jll", "Glib_jll", "JLLWrappers", "LZO_jll", "Libdl", "Pixman_jll", "Pkg", "Xorg_libXext_jll", "Xorg_libXrender_jll", "Zlib_jll", "libpng_jll"] git-tree-sha1 = "e2f47f6d8337369411569fd45ae5753ca10394c6" uuid = "83423d85-b0ee-5818-9007-b63ccbeb887a" version = "1.16.0+6" [[CategoricalArrays]] deps = ["DataAPI", "Future", "JSON", "Missings", "Printf", "Statistics", 
"StructTypes", "Unicode"] git-tree-sha1 = "5861101791fa76fafe8dddefd70ffbfe4e33ecae" uuid = "324d7699-5711-5eae-9e2f-1d82baa6b597" version = "0.9.0" [[ChainRulesCore]] deps = ["LinearAlgebra", "MuladdMacro", "SparseArrays"] git-tree-sha1 = "15081c431bb25848ad9b0d172a65794f3a3e197a" uuid = "d360d2e6-b24c-11e9-a2a3-2a2ae2dbcce4" version = "0.9.24" [[ClusterManagers]] deps = ["Distributed", "Logging", "Pkg", "Sockets"] git-tree-sha1 = "d0e2f616eb67985fd186f66f3ba09047befd3c24" uuid = "34f1f09b-3a8b-5176-ab39-66d58a4d544e" version = "0.4.0" [[Clustering]] deps = ["Distances", "LinearAlgebra", "NearestNeighbors", "Printf", "SparseArrays", "Statistics", "StatsBase"] git-tree-sha1 = "75479b7df4167267d75294d14b58244695beb2ac" uuid = "aaaa29a8-35af-508c-8bc3-b662a17a0fe5" version = "0.14.2" [[CodeTracking]] deps = ["InteractiveUtils", "UUIDs"] git-tree-sha1 = "8ad457cfeb0bca98732c97958ef81000a543e73e" uuid = "da1fd8a2-8d9e-5ec2-8556-3022fb5608a2" version = "1.0.5" [[CodecZlib]] deps = ["TranscodingStreams", "Zlib_jll"] git-tree-sha1 = "ded953804d019afa9a3f98981d99b33e3db7b6da" uuid = "944b1d66-785c-5afd-91f1-9de20f533193" version = "0.7.0" [[ColorSchemes]] deps = ["ColorTypes", "Colors", "FixedPointNumbers", "Random", "StaticArrays"] git-tree-sha1 = "3141757b5832ee7a0386db87997ee5a23ff20f4d" uuid = "35d6a980-a343-548e-a6ea-1d62b119f2f4" version = "3.10.2" [[ColorTypes]] deps = ["FixedPointNumbers", "Random"] git-tree-sha1 = "4bffea7ed1a9f0f3d1a131bbcd4b925548d75288" uuid = "3da002f7-5984-5a60-b8a6-cbb66c0b333f" version = "0.10.9" [[Colors]] deps = ["ColorTypes", "FixedPointNumbers", "InteractiveUtils", "Reexport"] git-tree-sha1 = "ac5f2213e56ed8a34a3dd2f681f4df1166b34929" uuid = "5ae59095-9a9b-59fe-a467-6f913c188581" version = "0.12.6" [[Combinatorics]] git-tree-sha1 = "08c8b6831dc00bfea825826be0bc8336fc369860" uuid = "861a8166-3701-5b0c-9a16-15d98fcdc6aa" version = "1.0.2" [[CommonSubexpressions]] deps = ["MacroTools", "Test"] git-tree-sha1 = 
"7b8a93dba8af7e3b42fecabf646260105ac373f7" uuid = "bbf7d656-a473-5ed7-a52c-81e309532950" version = "0.3.0" [[Compat]] deps = ["Base64", "Dates", "DelimitedFiles", "Distributed", "InteractiveUtils", "LibGit2", "Libdl", "LinearAlgebra", "Markdown", "Mmap", "Pkg", "Printf", "REPL", "Random", "SHA", "Serialization", "SharedArrays", "Sockets", "SparseArrays", "Statistics", "Test", "UUIDs", "Unicode"] git-tree-sha1 = "919c7f3151e79ff196add81d7f4e45d91bbf420b" uuid = "34da2185-b29b-5c13-b0c7-acf172513d20" version = "3.25.0" [[CompilerSupportLibraries_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "8e695f735fca77e9708e795eda62afdb869cbb70" uuid = "e66e0078-7015-5450-92f7-15fbd957f2ae" version = "0.3.4+0" [[CompositionsBase]] git-tree-sha1 = "f3955eb38944e5dd0fabf8ca1e267d94941d34a5" uuid = "a33af91c-f02d-484b-be07-31d278c5ca2b" version = "0.1.0" [[ConsoleProgressMonitor]] deps = ["Logging", "ProgressMeter"] git-tree-sha1 = "3ab7b2136722890b9af903859afcf457fa3059e8" uuid = "88cd18e8-d9cc-4ea6-8889-5259c0d15c8b" version = "0.1.2" [[ConstructionBase]] git-tree-sha1 = "a2a6a5fea4d6f730ec4c18a76d27ec10e8ec1c50" uuid = "187b0558-2788-49d3-abe0-74a17ed4e7c9" version = "1.0.0" [[Contour]] deps = ["StaticArrays"] git-tree-sha1 = "9f02045d934dc030edad45944ea80dbd1f0ebea7" uuid = "d38c429a-6771-53c6-b99e-75d170b6e991" version = "0.5.7" [[Crayons]] git-tree-sha1 = "3f71217b538d7aaee0b69ab47d9b7724ca8afa0d" uuid = "a8cc5b0e-0ffa-5ad4-8c14-923d3ee1735f" version = "4.0.4" [[DataAPI]] git-tree-sha1 = "ad84f52c0b8f05aa20839484dbaf01690b41ff84" uuid = "9a962f9c-6df0-11e9-0e5d-c546b8b5ee8a" version = "1.4.0" [[DataFrames]] deps = ["CategoricalArrays", "Compat", "DataAPI", "Future", "InvertedIndices", "IteratorInterfaceExtensions", "LinearAlgebra", "Markdown", "Missings", "PooledArrays", "PrettyTables", "Printf", "REPL", "Reexport", "SortingAlgorithms", "Statistics", "TableTraits", "Tables", "Unicode"] git-tree-sha1 = "b46e1deb4592a5df7416b10dfcd6b01fb194ab9a" uuid 
= "a93c6f00-e57d-5684-b7b6-d8193f3e46c0" version = "0.22.2" [[DataStructures]] deps = ["Compat", "InteractiveUtils", "OrderedCollections"] git-tree-sha1 = "fb0aa371da91c1ff9dc7fbed6122d3e411420b9c" uuid = "864edb3b-99cc-5e75-8d2d-829cb0a9cfe8" version = "0.18.8" [[DataValueInterfaces]] git-tree-sha1 = "bfc1187b79289637fa0ef6d4436ebdfe6905cbd6" uuid = "e2d170a0-9d28-54be-80f0-106bbe20a464" version = "1.0.0" [[DataValues]] deps = ["DataValueInterfaces", "Dates"] git-tree-sha1 = "d88a19299eba280a6d062e135a43f00323ae70bf" uuid = "e7dc6d0d-1eca-5fa6-8ad6-5aecde8b7ea5" version = "0.4.13" [[Dates]] deps = ["Printf"] uuid = "ade2ca70-3891-5945-98fb-dc099432e06a" [[DefineSingletons]] git-tree-sha1 = "1a356f194281dff9ef1119faa9125a0d4e210729" uuid = "244e2a9f-e319-4986-a169-4d1fe445cd52" version = "0.1.0" [[DelimitedFiles]] deps = ["Mmap"] uuid = "8bb1440f-4735-579b-a4ab-409b98df4dab" [[DiffResults]] deps = ["StaticArrays"] git-tree-sha1 = "c18e98cba888c6c25d1c3b048e4b3380ca956805" uuid = "163ba53b-c6d8-5494-b064-1a9d43ac40c5" version = "1.0.3" [[DiffRules]] deps = ["NaNMath", "Random", "SpecialFunctions"] git-tree-sha1 = "214c3fcac57755cfda163d91c58893a8723f93e9" uuid = "b552c78f-8df3-52c6-915a-8e097449b14b" version = "1.0.2" [[Distances]] deps = ["LinearAlgebra", "Statistics"] git-tree-sha1 = "e8b13ba5f166e11df2de6fc283e5db7864245df0" uuid = "b4f34e82-e78d-54a5-968a-f98e89d6e8f7" version = "0.10.0" [[Distributed]] deps = ["Random", "Serialization", "Sockets"] uuid = "8ba89e20-285c-5b6f-9357-94700520ee1b" [[DistributedArrays]] deps = ["Distributed", "LinearAlgebra", "Primes", "Random", "Serialization", "SparseArrays", "Statistics"] git-tree-sha1 = "ab2f313a5ef4db9d127b8fae4d922e268db1552f" uuid = "aaf54ef3-cdf8-58ed-94cc-d582ad619b94" version = "0.6.5" [[DistributedTopicModels]] deps = ["CUDA", "ClusterManagers", "Distributed", "DistributedArrays", "Distributions", "Documenter", "LinearAlgebra", "Random", "SharedArrays", "Statistics"] path = "dev/DistributedTopicModels" 
uuid = "84443b02-f120-4e83-b3f9-d8b671af1397" version = "0.1.0" [[Distributions]] deps = ["FillArrays", "LinearAlgebra", "PDMats", "Printf", "QuadGK", "Random", "SparseArrays", "SpecialFunctions", "StaticArrays", "Statistics", "StatsBase", "StatsFuns"] git-tree-sha1 = "2cce211af0abaa01354904e2af2232a4431d8b14" uuid = "31c24e10-a181-5473-b8eb-7969acd0382f" version = "0.24.8" [[DocStringExtensions]] deps = ["LibGit2", "Markdown", "Pkg", "Test"] git-tree-sha1 = "50ddf44c53698f5e784bbebb3f4b21c5807401b1" uuid = "ffbed154-4ef7-542d-bbb7-c09d3a79fcae" version = "0.8.3" [[Documenter]] deps = ["Base64", "Dates", "DocStringExtensions", "IOCapture", "InteractiveUtils", "JSON", "LibGit2", "Logging", "Markdown", "REPL", "Test", "Unicode"] git-tree-sha1 = "b7715ae18be02110a8cf9cc8ed2ccdb1e3e3aba2" uuid = "e30172f5-a6a5-5a46-863b-614d45cd2de4" version = "0.26.1" [[EarCut_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "92d8f9f208637e8d2d28c664051a00569c01493d" uuid = "5ae413db-bbd1-5e63-b57d-d24a61df00f5" version = "2.1.5+1" [[EllipsisNotation]] git-tree-sha1 = "18ee049accec8763be17a933737c1dd0fdf8673a" uuid = "da5c29d0-fa7d-589e-88eb-ea29b0a81949" version = "1.0.0" [[Expat_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "1402e52fcda25064f51c77a9655ce8680b76acf0" uuid = "2e619515-83b5-522b-bb60-26c02a35a201" version = "2.2.7+6" [[ExprTools]] git-tree-sha1 = "10407a39b87f29d47ebaca8edbc75d7c302ff93e" uuid = "e2ba6199-217a-4e67-a87a-7c52f15ade04" version = "0.1.3" [[FFMPEG]] deps = ["FFMPEG_jll", "x264_jll"] git-tree-sha1 = "9a73ffdc375be61b0e4516d83d880b265366fe1f" uuid = "c87230d0-a227-11e9-1b43-d7ebe4e7570a" version = "0.4.0" [[FFMPEG_jll]] deps = ["Artifacts", "Bzip2_jll", "FreeType2_jll", "FriBidi_jll", "JLLWrappers", "LAME_jll", "LibVPX_jll", "Libdl", "Ogg_jll", "OpenSSL_jll", "Opus_jll", "Pkg", "Zlib_jll", "libass_jll", "libfdk_aac_jll", "libvorbis_jll", "x264_jll", "x265_jll"] git-tree-sha1 = 
"3cc57ad0a213808473eafef4845a74766242e05f" uuid = "b22a6f82-2f65-5046-a5b2-351ab43fb4e5" version = "4.3.1+4" [[FFTW]] deps = ["AbstractFFTs", "FFTW_jll", "IntelOpenMP_jll", "Libdl", "LinearAlgebra", "MKL_jll", "Reexport"] git-tree-sha1 = "8b7c16b56936047ca41bf25effa137ae0b381ae8" uuid = "7a1cc6ca-52ef-59f5-83cd-3a7055c09341" version = "1.2.4" [[FFTW_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "5a0d4b6a22a34d17d53543bd124f4b08ed78e8b0" uuid = "f5851436-0d7a-5f13-b9de-f02708fd171a" version = "3.3.9+7" [[FileIO]] deps = ["Pkg"] git-tree-sha1 = "fee8955b9dfa7bec67117ef48085fb2b559b9c22" uuid = "5789e2e9-d7fb-5bc7-8068-2c6fae9b9549" version = "1.4.5" [[FileWatching]] uuid = "7b1f6079-737a-58dc-b8bc-7a2ca5c1b5ee" [[FillArrays]] deps = ["LinearAlgebra", "Random", "SparseArrays"] git-tree-sha1 = "ff537e5a3cba92fb48f30fec46723510450f2c0e" uuid = "1a297f60-69ca-5386-bcde-b61e274b549b" version = "0.10.2" [[FiniteDiff]] deps = ["ArrayInterface", "LinearAlgebra", "Requires", "SparseArrays", "StaticArrays"] git-tree-sha1 = "7f7216e0eb46c20ee8ddab5c8f9a262ed72587b6" uuid = "6a86dc24-6348-571c-b903-95158fe2bd41" version = "2.7.2" [[FixedPointNumbers]] deps = ["Statistics"] git-tree-sha1 = "335bfdceacc84c5cdf16aadc768aa5ddfc5383cc" uuid = "53c48c17-4a7d-5ca2-90c5-79b7896eea93" version = "0.8.4" [[Fontconfig_jll]] deps = ["Artifacts", "Bzip2_jll", "Expat_jll", "FreeType2_jll", "JLLWrappers", "Libdl", "Libuuid_jll", "Pkg", "Zlib_jll"] git-tree-sha1 = "35895cf184ceaab11fd778b4590144034a167a2f" uuid = "a3f928ae-7b40-5064-980b-68af3947d34b" version = "2.13.1+14" [[Formatting]] deps = ["Printf"] git-tree-sha1 = "8339d61043228fdd3eb658d86c926cb282ae72a8" uuid = "59287772-0a20-5a39-b81b-1366585eb4c0" version = "0.4.2" [[ForwardDiff]] deps = ["CommonSubexpressions", "DiffResults", "DiffRules", "NaNMath", "Random", "SpecialFunctions", "StaticArrays"] git-tree-sha1 = "8de2519a83c6c1c2442c2f481dd9a8364855daf4" uuid = "f6369f11-7733-5829-9624-2563aa707210" version 
= "0.10.14" [[FreeType2_jll]] deps = ["Artifacts", "Bzip2_jll", "JLLWrappers", "Libdl", "Pkg", "Zlib_jll"] git-tree-sha1 = "cbd58c9deb1d304f5a245a0b7eb841a2560cfec6" uuid = "d7e528f0-a631-5988-bf34-fe36492bcfd7" version = "2.10.1+5" [[FriBidi_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "0d20aed5b14dd4c9a2453c1b601d08e1149679cc" uuid = "559328eb-81f9-559d-9380-de523a88c83c" version = "1.0.5+6" [[Future]] deps = ["Random"] uuid = "9fa8497b-333b-5362-9e8d-4d0656e87820" [[GLFW_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Libglvnd_jll", "Pkg", "Xorg_libXcursor_jll", "Xorg_libXi_jll", "Xorg_libXinerama_jll", "Xorg_libXrandr_jll"] git-tree-sha1 = "a1bbf700b5388bffc3d882f4f4d625cf1c714fd7" uuid = "0656b61e-2033-5cc2-a64a-77c0f6c09b89" version = "3.3.2+1" [[GPUArrays]] deps = ["AbstractFFTs", "Adapt", "LinearAlgebra", "Printf", "Random", "Serialization"] git-tree-sha1 = "2c1dd57bca7ba0b3b4bf81d9332aeb81b154ef4c" uuid = "0c68f7d7-f131-5f86-a1c3-88cf8149b2d7" version = "6.1.2" [[GPUCompiler]] deps = ["DataStructures", "InteractiveUtils", "LLVM", "Libdl", "Scratch", "Serialization", "TimerOutputs", "UUIDs"] git-tree-sha1 = "c853c810b52a80f9aad79ab109207889e57f41ef" uuid = "61eb1bfa-7361-4325-ad38-22787b887f55" version = "0.8.3" [[GR]] deps = ["Base64", "DelimitedFiles", "GR_jll", "HTTP", "JSON", "LinearAlgebra", "Pkg", "Printf", "Random", "Serialization", "Sockets", "Test", "UUIDs"] git-tree-sha1 = "b90b826782cb3ac5b7a7f41b3fd0113180257ed4" uuid = "28b8d3ca-fb5f-59d9-8090-bfdbd6d07a71" version = "0.53.0" [[GR_jll]] deps = ["Artifacts", "Bzip2_jll", "Cairo_jll", "FFMPEG_jll", "Fontconfig_jll", "GLFW_jll", "JLLWrappers", "JpegTurbo_jll", "Libdl", "Libtiff_jll", "Pixman_jll", "Pkg", "Qt_jll", "Zlib_jll", "libpng_jll"] git-tree-sha1 = "8aee6fa096b0cbdb05e71750c978b96a08c78951" uuid = "d2c73de3-f751-5644-a686-071e5b155ba9" version = "0.53.0+0" [[GZip]] deps = ["Libdl"] git-tree-sha1 = "039be665faf0b8ae36e089cd694233f5dee3f7d6" uuid = 
"92fee26a-97fe-5a0c-ad85-20a5f3185b63" version = "0.5.1" [[GeometryBasics]] deps = ["EarCut_jll", "IterTools", "LinearAlgebra", "StaticArrays", "StructArrays", "Tables"] git-tree-sha1 = "876f77f0d3253e882ff588af1c95d0e4a86c9766" uuid = "5c1252a2-5f33-56bf-86c9-59e7332b4326" version = "0.3.5" [[Gettext_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Libiconv_jll", "Pkg", "XML2_jll"] git-tree-sha1 = "8c14294a079216000a0bdca5ec5a447f073ddc9d" uuid = "78b55507-aeef-58d4-861c-77aaff3498b1" version = "0.20.1+7" [[Glib_jll]] deps = ["Artifacts", "Gettext_jll", "JLLWrappers", "Libdl", "Libffi_jll", "Libiconv_jll", "Libmount_jll", "PCRE_jll", "Pkg", "Zlib_jll"] git-tree-sha1 = "04690cc5008b38ecbdfede949220bc7d9ba26397" uuid = "7746bdde-850d-59dc-9ae8-88ece973131d" version = "2.59.0+4" [[Grisu]] git-tree-sha1 = "03d381f65183cb2d0af8b3425fde97263ce9a995" uuid = "42e2da0e-8278-4e71-bc24-59509adca0fe" version = "1.0.0" [[HTTP]] deps = ["Base64", "Dates", "IniFile", "MbedTLS", "Sockets"] git-tree-sha1 = "c7ec02c4c6a039a98a15f955462cd7aea5df4508" uuid = "cd3eb016-35fb-5094-929b-558a96fad6f3" version = "0.8.19" [[IOCapture]] deps = ["Logging"] git-tree-sha1 = "377252859f740c217b936cebcd918a44f9b53b59" uuid = "b5f81e59-6552-4d32-b1f0-c071b021bf89" version = "0.1.1" [[IniFile]] deps = ["Test"] git-tree-sha1 = "098e4d2c533924c921f9f9847274f2ad89e018b8" uuid = "83e8ac13-25f8-5344-8a64-a9f2b223428f" version = "0.5.0" [[InitialValues]] git-tree-sha1 = "26c8832afd63ac558b98a823265856670d898b6c" uuid = "22cec73e-a1b8-11e9-2c92-598750a2cf9c" version = "0.2.10" [[IntelOpenMP_jll]] deps = ["Libdl", "Pkg"] git-tree-sha1 = "fb8e1c7a5594ba56f9011310790e03b5384998d6" uuid = "1d5cc7b8-4909-519e-a0f8-d0f5ad9712d0" version = "2018.0.3+0" [[InteractiveUtils]] deps = ["Markdown"] uuid = "b77e0a4c-d291-57a0-90e8-8db25a27a240" [[Interpolations]] deps = ["AxisAlgorithms", "LinearAlgebra", "OffsetArrays", "Random", "Ratios", "SharedArrays", "SparseArrays", "StaticArrays", "WoodburyMatrices"] 
git-tree-sha1 = "eb1dd6d5b2275faaaa18533e0fc5f9171cec25fa" uuid = "a98d9a8b-a2ab-59e6-89dd-64a1c18fca59" version = "0.13.1" [[IntervalSets]] deps = ["Dates", "EllipsisNotation", "Statistics"] git-tree-sha1 = "93a6d78525feb0d3ee2a2ae83a7d04db1db5663f" uuid = "8197267c-284f-5f27-9208-e0e47529a953" version = "0.5.2" [[InvertedIndices]] deps = ["Test"] git-tree-sha1 = "15732c475062348b0165684ffe28e85ea8396afc" uuid = "41ab1584-1d38-5bbf-9106-f11c6c58b48f" version = "1.0.0" [[IterTools]] git-tree-sha1 = "05110a2ab1fc5f932622ffea2a003221f4782c18" uuid = "c8e1da08-722c-5040-9ed9-7db0dc04731e" version = "1.3.0" [[IteratorInterfaceExtensions]] git-tree-sha1 = "a3f24677c21f5bbe9d2a714f95dcd58337fb2856" uuid = "82899510-4779-5014-852e-03e436cf321d" version = "1.0.0" [[JLD2]] deps = ["CodecZlib", "DataStructures", "MacroTools", "Mmap", "Pkg", "Printf", "Requires", "UUIDs"] git-tree-sha1 = "0fd0b0043cae454eed05bccd6dcfcdddc3f21f7e" uuid = "033835bb-8acc-5ee8-8aae-3f567f8a3819" version = "0.3.1" [[JLLWrappers]] git-tree-sha1 = "c70593677bbf2c3ccab4f7500d0f4dacfff7b75c" uuid = "692b3bcd-3c85-4b1f-b108-f13ce0eb3210" version = "1.1.3" [[JSON]] deps = ["Dates", "Mmap", "Parsers", "Unicode"] git-tree-sha1 = "81690084b6198a2e1da36fcfda16eeca9f9f24e4" uuid = "682c06a0-de6a-54ab-a142-c8b1cf79cde6" version = "0.21.1" [[JpegTurbo_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "9aff0587d9603ea0de2c6f6300d9f9492bbefbd3" uuid = "aacddb02-875f-59d6-b918-886e6ef4fbf8" version = "2.0.1+3" [[JuliaInterpreter]] deps = ["CodeTracking", "InteractiveUtils", "Random", "UUIDs"] git-tree-sha1 = "fe18234f046a772069abdc8d29f073d8c0f092a5" uuid = "aa1ae85d-cabe-5617-a682-6adf51b2e16a" version = "0.8.8" [[KernelDensity]] deps = ["Distributions", "DocStringExtensions", "FFTW", "Interpolations", "StatsBase"] git-tree-sha1 = "09aeec87bdc9c1fa70d0b508dfa94a21acd280d9" uuid = "5ab0869b-81aa-558d-bb23-cbf5423bbe9b" version = "0.6.2" [[LAME_jll]] deps = ["Artifacts", "JLLWrappers", 
"Libdl", "Pkg"] git-tree-sha1 = "df381151e871f41ee86cee4f5f6fd598b8a68826" uuid = "c1c5ebd0-6772-5130-a774-d5fcae4a789d" version = "3.100.0+3" [[LLVM]] deps = ["CEnum", "Libdl", "Printf", "Unicode"] git-tree-sha1 = "a2101830a761d592b113129887fda626387f68d4" uuid = "929cbde3-209d-540e-8aea-75f648917ca0" version = "3.5.1" [[LZO_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "f128cd6cd05ffd6d3df0523ed99b90ff6f9b349a" uuid = "dd4b983a-f0e5-5f8d-a1b7-129d4a5fb1ac" version = "2.10.0+3" [[LaTeXStrings]] git-tree-sha1 = "c7aebfecb1a60d59c0fe023a68ec947a208b1e6b" uuid = "b964fa9f-0449-5b57-a5c2-d3ea65f4040f" version = "1.2.0" [[Latexify]] deps = ["Formatting", "InteractiveUtils", "LaTeXStrings", "MacroTools", "Markdown", "Printf", "Requires"] git-tree-sha1 = "3a0084cec7bf157edcb45a67fac0647f88fe5eaf" uuid = "23fbe1c1-3f47-55db-b15f-69d7ec21a316" version = "0.14.7" [[LeftChildRightSiblingTrees]] deps = ["AbstractTrees"] git-tree-sha1 = "71be1eb5ad19cb4f61fa8c73395c0338fd092ae0" uuid = "1d6d02ad-be62-4b6b-8a6d-2f90e265016e" version = "0.1.2" [[LibGit2]] deps = ["Printf"] uuid = "76f85450-5226-5b5a-8eaa-529ad045b433" [[LibVPX_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "85fcc80c3052be96619affa2fe2e6d2da3908e11" uuid = "dd192d2f-8180-539f-9fb4-cc70b1dcf69a" version = "1.9.0+1" [[Libdl]] uuid = "8f399da3-3557-5675-b5ff-fb832c97cbdb" [[Libffi_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "a2cd088a88c0d37eef7d209fd3d8712febce0d90" uuid = "e9f186c6-92d2-5b65-8a66-fee21dc1b490" version = "3.2.1+4" [[Libgcrypt_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Libgpg_error_jll", "Pkg"] git-tree-sha1 = "b391a18ab1170a2e568f9fb8d83bc7c780cb9999" uuid = "d4300ac3-e22c-5743-9152-c294e39db1e4" version = "1.8.5+4" [[Libglvnd_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_libX11_jll", "Xorg_libXext_jll"] git-tree-sha1 = "7739f837d6447403596a75d19ed01fd08d6f56bf" uuid = 
"7e76a0d4-f3c7-5321-8279-8d96eeed0f29" version = "1.3.0+3" [[Libgpg_error_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "ec7f2e8ad5c9fa99fc773376cdbc86d9a5a23cb7" uuid = "7add5ba3-2f88-524e-9cd5-f83b8a55f7b8" version = "1.36.0+3" [[Libiconv_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "8e924324b2e9275a51407a4e06deb3455b1e359f" uuid = "94ce4f54-9a6c-5748-9c1c-f9c7231a4531" version = "1.16.0+7" [[Libmount_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "51ad0c01c94c1ce48d5cad629425035ad030bfd5" uuid = "4b2f31a3-9ecc-558c-b454-b3730dcb73e9" version = "2.34.0+3" [[Libtiff_jll]] deps = ["Artifacts", "JLLWrappers", "JpegTurbo_jll", "Libdl", "Pkg", "Zlib_jll", "Zstd_jll"] git-tree-sha1 = "291dd857901f94d683973cdf679984cdf73b56d0" uuid = "89763e89-9b03-5906-acba-b20f662cd828" version = "4.1.0+2" [[Libuuid_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "f879ae9edbaa2c74c922e8b85bb83cc84ea1450b" uuid = "38a345b3-de98-5d2b-a5d3-14cd9215e700" version = "2.34.0+7" [[LineSearches]] deps = ["LinearAlgebra", "NLSolversBase", "NaNMath", "Parameters", "Printf"] git-tree-sha1 = "f27132e551e959b3667d8c93eae90973225032dd" uuid = "d3d80556-e9d4-5f37-9878-2ab0fcc64255" version = "7.1.1" [[LinearAlgebra]] deps = ["Libdl"] uuid = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e" [[Logging]] uuid = "56ddb016-857b-54e1-b83d-db4d58db5568" [[LoggingExtras]] deps = ["Dates"] git-tree-sha1 = "03289aba73c0abc25ff0229bed60f2a4129cd15c" uuid = "e6f89c97-d47a-5376-807f-9c37f3926c36" version = "0.4.2" [[LoweredCodeUtils]] deps = ["JuliaInterpreter"] git-tree-sha1 = "f008f15264cc11de6de8cbdda3d4712dd152f0c3" uuid = "6f1432cf-f94c-5a45-995e-cdbf5db27b0b" version = "1.2.7" [[MCMCChains]] deps = ["AbstractFFTs", "AbstractMCMC", "AxisArrays", "Compat", "Distributions", "Formatting", "IteratorInterfaceExtensions", "LinearAlgebra", "MLJModelInterface", "NaturalSort", "PrettyTables", "Random", "RecipesBase", 
"Serialization", "SpecialFunctions", "Statistics", "StatsBase", "TableTraits", "Tables"] git-tree-sha1 = "8df14e3546bfb4fc05acfb1e932cb67387efa201" uuid = "c7f686f2-ff18-58e9-bc7b-31028e88f75d" version = "4.4.0" [[MKL_jll]] deps = ["IntelOpenMP_jll", "Libdl", "Pkg"] git-tree-sha1 = "eb540ede3aabb8284cb482aa41d00d6ca850b1f8" uuid = "856f044c-d86e-5d09-b602-aeab76dc8ba7" version = "2020.2.254+0" [[MLJModelInterface]] deps = ["Random", "ScientificTypes"] git-tree-sha1 = "a63e200c4d8bfb3820db9849cc1950a91ddad761" uuid = "e80e1ace-859a-464e-9ed9-23947d8ae3ea" version = "0.3.6" [[MacroTools]] deps = ["Markdown", "Random"] git-tree-sha1 = "6a8a2a625ab0dea913aba95c11370589e0239ff0" uuid = "1914dd2f-81c6-5fcd-8719-6d5c9610ff09" version = "0.5.6" [[Markdown]] deps = ["Base64"] uuid = "d6f4376e-aef5-505a-96c1-9c027394607a" [[MbedTLS]] deps = ["Dates", "MbedTLS_jll", "Random", "Sockets"] git-tree-sha1 = "1c38e51c3d08ef2278062ebceade0e46cefc96fe" uuid = "739be429-bea8-5141-9913-cc70e7f3736d" version = "1.0.3" [[MbedTLS_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "0eef589dd1c26a3ac9d753fe1a8bcad63f956fa6" uuid = "c8ffd9c3-330d-5841-b78e-0817d7145fa1" version = "2.16.8+1" [[Measures]] git-tree-sha1 = "e498ddeee6f9fdb4551ce855a46f54dbd900245f" uuid = "442fdcdd-2543-5da2-b0f3-8c86c306513e" version = "0.3.1" [[MicroCollections]] deps = ["BangBang", "Setfield"] git-tree-sha1 = "e991b6a9d38091c4a0d7cd051fcb57c05f98ac03" uuid = "128add7d-3638-4c79-886c-908ea0c25c34" version = "0.1.0" [[Missings]] deps = ["DataAPI"] git-tree-sha1 = "ed61674a0864832495ffe0a7e889c0da76b0f4c8" uuid = "e1d29d7a-bbdc-5cf2-9ac0-f12de2c33e28" version = "0.4.4" [[Mmap]] uuid = "a63ad114-7e13-5084-954f-fe012c677804" [[MuladdMacro]] git-tree-sha1 = "c6190f9a7fc5d9d5915ab29f2134421b12d24a68" uuid = "46d2c3a1-f734-5fdb-9937-b9b9aeba4221" version = "0.2.2" [[MultivariateStats]] deps = ["Arpack", "LinearAlgebra", "SparseArrays", "Statistics", "StatsBase"] git-tree-sha1 = 
"352fae519b447bf52e6de627b89f448bcd469e4e" uuid = "6f286f6a-111f-5878-ab1e-185364afe411" version = "0.7.0" [[NLSolversBase]] deps = ["DiffResults", "Distributed", "FiniteDiff", "ForwardDiff"] git-tree-sha1 = "39d6bc45e99c96e6995cbddac02877f9b61a1dd1" uuid = "d41bc354-129a-5804-8e4c-c37616107c6c" version = "7.7.1" [[NNlib]] deps = ["Compat", "Libdl", "LinearAlgebra", "Pkg", "Requires", "Statistics"] git-tree-sha1 = "2b7c3213ed4f2eed686f9f531f85d3ea2f75286f" uuid = "872c559c-99b0-510c-b3b7-b6c96a88d5cd" version = "0.7.9" [[NaNMath]] git-tree-sha1 = "bfe47e760d60b82b66b61d2d44128b62e3a369fb" uuid = "77ba4419-2d1f-58cd-9bb1-8ffee604a2e3" version = "0.3.5" [[NaturalSort]] git-tree-sha1 = "eda490d06b9f7c00752ee81cfa451efe55521e21" uuid = "c020b1a1-e9b0-503a-9c33-f039bfc54a85" version = "1.0.0" [[NearestNeighbors]] deps = ["Distances", "StaticArrays"] git-tree-sha1 = "9afd724797039125e8e2cc362098f01dab60bc3a" uuid = "b8a86587-4115-5ab1-83bc-aa920d37bbce" version = "0.4.8" [[Observables]] git-tree-sha1 = "635fe10760447cfa86f5118edf2f47eb864fb495" uuid = "510215fc-4207-5dde-b226-833fc4488ee2" version = "0.3.2" [[OffsetArrays]] deps = ["Adapt"] git-tree-sha1 = "b0cc1c42b63e30b759f4e1cf045ad8a51069d6cc" uuid = "6fe1bfb0-de20-5000-8ca7-80f57d26f881" version = "1.4.2" [[Ogg_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "a42c0f138b9ebe8b58eba2271c5053773bde52d0" uuid = "e7412a2a-1a6e-54c0-be00-318e2571c051" version = "1.3.4+2" [[OpenBLAS_jll]] deps = ["CompilerSupportLibraries_jll", "Libdl", "Pkg"] git-tree-sha1 = "0c922fd9634e358622e333fc58de61f05a048492" uuid = "4536629a-c528-5b80-bd46-f80d51c5b363" version = "0.3.9+5" [[OpenSSL_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "71bbbc616a1d710879f5a1021bcba65ffba6ce58" uuid = "458c3c95-2e84-50aa-8efc-19380b2a3a95" version = "1.1.1+6" [[OpenSpecFun_jll]] deps = ["Artifacts", "CompilerSupportLibraries_jll", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = 
"9db77584158d0ab52307f8c04f8e7c08ca76b5b3" uuid = "efe28fd5-8261-553b-a9e1-b2916fc3738e" version = "0.5.3+4" [[Optim]] deps = ["Compat", "FillArrays", "LineSearches", "LinearAlgebra", "NLSolversBase", "NaNMath", "Parameters", "PositiveFactorizations", "Printf", "SparseArrays", "StatsBase"] git-tree-sha1 = "bc382053437572df944d02be10b5142808afab7e" uuid = "429524aa-4258-5aef-a3af-852621145aeb" version = "1.2.1" [[Opus_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "f9d57f4126c39565e05a2b0264df99f497fc6f37" uuid = "91d4177d-7536-5919-b921-800302f37372" version = "1.3.1+3" [[OrderedCollections]] git-tree-sha1 = "cf59cfed2e2c12e8a2ff0a4f1e9b2cd8650da6db" uuid = "bac558e1-5e72-5ebc-8fee-abe8a469f55d" version = "1.3.2" [[PCRE_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "1b556ad51dceefdbf30e86ffa8f528b73c7df2bb" uuid = "2f80f16e-611a-54ab-bc61-aa92de5b98fc" version = "8.42.0+4" [[PDMats]] deps = ["LinearAlgebra", "SparseArrays", "SuiteSparse", "Test"] git-tree-sha1 = "95a4038d1011dfdbde7cecd2ad0ac411e53ab1bc" uuid = "90014a1f-27ba-587c-ab20-58faa44d9150" version = "0.10.1" [[ParallelKMeans]] deps = ["Distances", "MLJModelInterface", "Random", "StatsBase", "UnsafeArrays"] git-tree-sha1 = "3174da4811ffa7e0add7f5b8d1b44525189503e2" uuid = "42b8e9d4-006b-409a-8472-7f34b3fb58af" version = "0.1.9" [[Parameters]] deps = ["OrderedCollections", "UnPack"] git-tree-sha1 = "38b2e970043613c187bd56a995fe2e551821eb4a" uuid = "d96e819e-fc66-5662-9728-84c9c7592b0a" version = "0.12.1" [[Parsers]] deps = ["Dates"] git-tree-sha1 = "50c9a9ed8c714945e01cd53a21007ed3865ed714" uuid = "69de0a69-1ddd-5017-9359-2bf0b02dc9f0" version = "1.0.15" [[Pixman_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "6a20a83c1ae86416f0a5de605eaea08a552844a3" uuid = "30392449-352a-5448-841d-b1acce4e97dc" version = "0.40.0+0" [[Pkg]] deps = ["Dates", "LibGit2", "Libdl", "Logging", "Markdown", "Printf", "REPL", "Random", "SHA", "UUIDs"] 
uuid = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f" [[PlotThemes]] deps = ["PlotUtils", "Requires", "Statistics"] git-tree-sha1 = "c6f5ea535551b3b16835134697f0c65d06c94b91" uuid = "ccf2f8ad-2431-5c83-bf29-c5338b663b6a" version = "2.0.0" [[PlotUtils]] deps = ["ColorSchemes", "Colors", "Dates", "Printf", "Random", "Reexport", "Statistics"] git-tree-sha1 = "6a59c282058f46967069972d74526a68d27a9012" uuid = "995b91a9-d308-5afd-9ec6-746e21dbc043" version = "1.0.8" [[Plots]] deps = ["Base64", "Contour", "Dates", "FFMPEG", "FixedPointNumbers", "GR", "GeometryBasics", "JSON", "Latexify", "LinearAlgebra", "Measures", "NaNMath", "PlotThemes", "PlotUtils", "Printf", "REPL", "Random", "RecipesBase", "RecipesPipeline", "Reexport", "Requires", "Scratch", "Showoff", "SparseArrays", "Statistics", "StatsBase", "UUIDs"] git-tree-sha1 = "173c7250ccd7c98615b04c669eb13fa7fab494b0" uuid = "91a5bcdd-55d7-5caf-9e0b-520d859cae80" version = "1.9.1" [[PooledArrays]] deps = ["DataAPI"] git-tree-sha1 = "b1333d4eced1826e15adbdf01a4ecaccca9d353c" uuid = "2dfb63ee-cc39-5dd5-95bd-886bf059d720" version = "0.5.3" [[PositiveFactorizations]] deps = ["LinearAlgebra"] git-tree-sha1 = "17275485f373e6673f7e7f97051f703ed5b15b20" uuid = "85a6dd25-e78a-55b7-8502-1745935b8125" version = "0.2.4" [[PrettyTables]] deps = ["Crayons", "Formatting", "Markdown", "Reexport", "Tables"] git-tree-sha1 = "237170206bf38a66fee4d845f4ae57f63788eeb0" uuid = "08abe8d2-0d0c-5749-adfa-8a2ac140af0d" version = "0.10.1" [[Primes]] deps = ["Test"] git-tree-sha1 = "ff1a2323cb468ec5f201838fcbe3c232266b1f95" uuid = "27ebfcd6-29c5-5fa9-bf4b-fb8fc14df3ae" version = "0.4.0" [[Printf]] deps = ["Unicode"] uuid = "de0858da-6303-5e67-8744-51eddeeeb8d7" [[ProgressLogging]] deps = ["Logging", "SHA", "UUIDs"] git-tree-sha1 = "59398022b661b6fd569f25de6b18fde39843196a" uuid = "33c8b6b6-d38a-422a-b730-caa89a2f386c" version = "0.1.3" [[ProgressMeter]] deps = ["Distributed", "Printf"] git-tree-sha1 = "45640774ee2efa24e52686dbdf895e88102e68fc" uuid = 
"92933f4c-e287-5a05-a399-4b506db050ca" version = "1.4.1" [[Qt_jll]] deps = ["Artifacts", "CompilerSupportLibraries_jll", "Fontconfig_jll", "Glib_jll", "JLLWrappers", "Libdl", "Pkg", "Xorg_libXext_jll", "Xorg_libxcb_jll", "Xorg_xcb_util_image_jll", "Xorg_xcb_util_keysyms_jll", "Xorg_xcb_util_renderutil_jll", "Xorg_xcb_util_wm_jll", "Zlib_jll", "xkbcommon_jll"] git-tree-sha1 = "c0efbd50dd55f6ac89ae5a81b114e54ab6754100" uuid = "ede63266-ebff-546c-83e0-1c6fb6d0efc8" version = "5.15.2+0" [[QuadGK]] deps = ["DataStructures", "LinearAlgebra"] git-tree-sha1 = "12fbe86da16df6679be7521dfb39fbc861e1dc7b" uuid = "1fd47b50-473d-5c70-9696-f719f8f3bcdc" version = "2.4.1" [[REPL]] deps = ["InteractiveUtils", "Markdown", "Sockets"] uuid = "3fa0cd96-eef1-5676-8a61-b3b8758bbffb" [[Random]] deps = ["Serialization"] uuid = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c" [[RangeArrays]] git-tree-sha1 = "b9039e93773ddcfc828f12aadf7115b4b4d225f5" uuid = "b3c3ace0-ae52-54e7-9d0b-2c1406fd6b9d" version = "0.3.2" [[Ratios]] git-tree-sha1 = "37d210f612d70f3f7d57d488cb3b6eff56ad4e41" uuid = "c84ed2f1-dad5-54f0-aa8e-dbefe2724439" version = "0.4.0" [[RecipesBase]] git-tree-sha1 = "b3fb709f3c97bfc6e948be68beeecb55a0b340ae" uuid = "3cdcf5f2-1ef4-517c-9805-6587b60abb01" version = "1.1.1" [[RecipesPipeline]] deps = ["Dates", "NaNMath", "PlotUtils", "RecipesBase"] git-tree-sha1 = "9ea2f5bf1b26918b16e9f885bb8e05206bfc2144" uuid = "01d81517-befc-4cb6-b9ec-a95719d0359c" version = "0.2.1" [[Reexport]] deps = ["Pkg"] git-tree-sha1 = "7b1d07f411bc8ddb7977ec7f377b97b158514fe0" uuid = "189a3867-3050-52da-a836-e630ba90ab69" version = "0.2.0" [[Requires]] deps = ["UUIDs"] git-tree-sha1 = "cfbac6c1ed70c002ec6361e7fd334f02820d6419" uuid = "ae029012-a4dd-5104-9daa-d747884805df" version = "1.1.2" [[Revise]] deps = ["CodeTracking", "Distributed", "FileWatching", "JuliaInterpreter", "LibGit2", "LoweredCodeUtils", "OrderedCollections", "Pkg", "REPL", "Requires", "UUIDs", "Unicode"] git-tree-sha1 = 
"176c817f5e5a9c78fd0d91483dadc88cc5805c41" uuid = "295af30f-e4ad-537b-8983-00126c2a3abe" version = "3.1.11" [[Rmath]] deps = ["Random", "Rmath_jll"] git-tree-sha1 = "86c5647b565873641538d8f812c04e4c9dbeb370" uuid = "79098fc4-a85e-5d69-aa6a-4863f24498fa" version = "0.6.1" [[Rmath_jll]] deps = ["Libdl", "Pkg"] git-tree-sha1 = "d76185aa1f421306dec73c057aa384bad74188f0" uuid = "f50d1b31-88e8-58de-be2c-1cc44531875f" version = "0.2.2+1" [[SHA]] uuid = "ea8e919c-243c-51af-8825-aaa63cd721ce" [[SafeTestsets]] deps = ["Test"] git-tree-sha1 = "36ebc5622c82eb9324005cc75e7e2cc51181d181" uuid = "1bc83da4-3b8d-516f-aca4-4fe02f6d838f" version = "0.0.1" [[ScientificTypes]] git-tree-sha1 = "1d3f5f8bdf5dd0c9951eb9c595ee08a728aec331" uuid = "321657f4-b219-11e9-178b-2701a2544e81" version = "1.1.1" [[Scratch]] deps = ["Dates"] git-tree-sha1 = "ad4b278adb62d185bbcb6864dc24959ab0627bf6" uuid = "6c6a2e73-6563-6170-7368-637461726353" version = "1.0.3" [[SentinelArrays]] deps = ["Dates", "Random"] git-tree-sha1 = "6ccde405cf0759eba835eb613130723cb8f10ff9" uuid = "91c51154-3ec4-41a3-a24f-3f23e20d615c" version = "1.2.16" [[Serialization]] uuid = "9e88b42a-f829-5b0c-bbe9-9e923198166b" [[Setfield]] deps = ["ConstructionBase", "Future", "MacroTools", "Requires"] git-tree-sha1 = "d5640fc570fb1b6c54512f0bd3853866bd298b3e" uuid = "efcf1570-3423-57d1-acb7-fd33fddbac46" version = "0.7.0" [[SharedArrays]] deps = ["Distributed", "Mmap", "Random", "Serialization"] uuid = "1a1011a3-84de-559e-8e89-a11a2f7dc383" [[Showoff]] deps = ["Dates", "Grisu"] git-tree-sha1 = "ee010d8f103468309b8afac4abb9be2e18ff1182" uuid = "992d4aef-0814-514b-bc4d-f2e9a6c4116f" version = "0.3.2" [[Sockets]] uuid = "6462fe0b-24de-5631-8697-dd941f90decc" [[SortingAlgorithms]] deps = ["DataStructures", "Random", "Test"] git-tree-sha1 = "03f5898c9959f8115e30bc7226ada7d0df554ddd" uuid = "a2af1166-a08f-5f64-846c-94a0d3cef48c" version = "0.3.1" [[SparseArrays]] deps = ["LinearAlgebra", "Random"] uuid = 
"2f01184e-e22b-5df5-ae63-d93ebab69eaf" [[SpecialFunctions]] deps = ["ChainRulesCore", "OpenSpecFun_jll"] git-tree-sha1 = "75394dbe2bd346beeed750fb02baa6445487b862" uuid = "276daf66-3868-5448-9aa4-cd146d93841b" version = "1.2.1" [[SplittablesBase]] deps = ["Setfield", "Test"] git-tree-sha1 = "ab80edcbd61a44a4dc489d06ead964a863c0a898" uuid = "171d559e-b47b-412a-8079-5efa626c420e" version = "0.1.10" [[StaticArrays]] deps = ["LinearAlgebra", "Random", "Statistics"] git-tree-sha1 = "9da72ed50e94dbff92036da395275ed114e04d49" uuid = "90137ffa-7385-5640-81b9-e52037218182" version = "1.0.1" [[Statistics]] deps = ["LinearAlgebra", "SparseArrays"] uuid = "10745b16-79ce-11e8-11f9-7d13ad32a3b2" [[StatsBase]] deps = ["DataAPI", "DataStructures", "LinearAlgebra", "Missings", "Printf", "Random", "SortingAlgorithms", "SparseArrays", "Statistics"] git-tree-sha1 = "7bab7d4eb46b225b35179632852b595a3162cb61" uuid = "2913bbd2-ae8a-5f71-8c99-4fb6c76f3a91" version = "0.33.2" [[StatsFuns]] deps = ["Rmath", "SpecialFunctions"] git-tree-sha1 = "3b9f665c70712af3264b61c27a7e1d62055dafd1" uuid = "4c63d2b9-4356-54db-8cca-17b64c39e42c" version = "0.9.6" [[StatsPlots]] deps = ["Clustering", "DataStructures", "DataValues", "Distributions", "Interpolations", "KernelDensity", "LinearAlgebra", "MultivariateStats", "Observables", "Plots", "RecipesBase", "RecipesPipeline", "Reexport", "StatsBase", "TableOperations", "Tables", "Widgets"] git-tree-sha1 = "0904a834846e7f4796636171fe002368e755dffc" uuid = "f3b207a7-027a-5e70-b257-86293d7955fd" version = "0.14.17" [[StructArrays]] deps = ["Adapt", "DataAPI", "Tables"] git-tree-sha1 = "8099ed9fb90b6e754d6ba8c6ed8670f010eadca0" uuid = "09ab397b-f2b6-538f-b94a-2f83cf4a842a" version = "0.4.4" [[StructTypes]] deps = ["Dates", "UUIDs"] git-tree-sha1 = "d94235fcdc4a09649f263365c5f7e4ed4ba6ed34" uuid = "856f2bd8-1eba-4b0a-8007-ebc267875bd4" version = "1.2.1" [[SuiteSparse]] deps = ["Libdl", "LinearAlgebra", "Serialization", "SparseArrays"] uuid = 
"4607b0f0-06f3-5cda-b6b1-a6196a1729e9" [[SupervisedOmics]] deps = ["Distributions", "Random", "SpecialFunctions"] path = "dev/SupervisedOmics" uuid = "7ab76c79-0253-45b8-b1d2-3fdc362146dd" version = "0.1.0" [[SyntheticMixtureData]] deps = ["Distributions", "LinearAlgebra", "Random", "SafeTestsets"] path = "dev/SyntheticMixtureData" uuid = "21788f52-8b02-4c2b-a987-7de384f153b0" version = "0.1.0" [[TableOperations]] deps = ["SentinelArrays", "Tables", "Test"] git-tree-sha1 = "85490cabedd41c56cf7574daec34769e0e2851b9" uuid = "ab02a1b2-a7df-11e8-156e-fb1833f50b87" version = "0.3.0" [[TableTraits]] deps = ["IteratorInterfaceExtensions"] git-tree-sha1 = "b1ad568ba658d8cbb3b892ed5380a6f3e781a81e" uuid = "3783bdb8-4a98-5b6b-af9a-565f29a5fe9c" version = "1.0.0" [[Tables]] deps = ["DataAPI", "DataValueInterfaces", "IteratorInterfaceExtensions", "LinearAlgebra", "TableTraits", "Test"] git-tree-sha1 = "240d19b8762006ff04b967bdd833269ad642d550" uuid = "bd369af6-aec1-5ad0-b16a-f7cc5008161c" version = "1.2.2" [[TerminalLoggers]] deps = ["LeftChildRightSiblingTrees", "Logging", "Markdown", "Printf", "ProgressLogging", "UUIDs"] git-tree-sha1 = "cbea752b5eef52a3e1188fb31580c3e4fa0cbc35" uuid = "5d786b92-1e48-4d6f-9151-6b4477ca9bed" version = "0.1.2" [[Test]] deps = ["Distributed", "InteractiveUtils", "Logging", "Random"] uuid = "8dfed614-e22c-5e08-85e1-65c5234f0b40" [[TimerOutputs]] deps = ["Printf"] git-tree-sha1 = "3318281dd4121ecf9713ce1383b9ace7d7476fdd" uuid = "a759f4b9-e2f1-59dc-863e-4aeb61b1ea8f" version = "0.5.7" [[TopicModels]] deps = ["CUDA", "Distributions", "LinearAlgebra", "Optim", "Random", "SpecialFunctions"] path = "dev/TopicModels" uuid = "e9825ca3-3499-4c9b-97dc-a93734876e50" version = "0.1.0" [[TranscodingStreams]] deps = ["Random", "Test"] git-tree-sha1 = "7c53c35547de1c5b9d46a4797cf6d8253807108c" uuid = "3bb67fe8-82b1-5028-8e26-92a6c54297fa" version = "0.9.5" [[Transducers]] deps = ["ArgCheck", "BangBang", "CompositionsBase", "DefineSingletons", "Distributed", 
"InitialValues", "Logging", "Markdown", "MicroCollections", "Requires", "Setfield", "SplittablesBase", "Tables"] git-tree-sha1 = "80f9fad2026c304f391198d391a0c698b666b201" uuid = "28d57a85-8fef-5791-bfe6-a80928e7c999" version = "0.4.53" [[UUIDs]] deps = ["Random", "SHA"] uuid = "cf7118a7-6976-5b1a-9a39-7adc72f591a4" [[UnPack]] git-tree-sha1 = "387c1f73762231e86e0c9c5443ce3b4a0a9a0c2b" uuid = "3a884ed6-31ef-47d7-9d2a-63182c4928ed" version = "1.0.2" [[Unicode]] uuid = "4ec0a83e-493e-50e2-b9ac-8f72acf5a8f5" [[UnsafeArrays]] git-tree-sha1 = "9740b414f85ec2fa9135066f81b1fb14212befd6" uuid = "c4a57d5a-5b31-53a6-b365-19f8c011fbd6" version = "1.0.1" [[Wayland_jll]] deps = ["Artifacts", "Expat_jll", "JLLWrappers", "Libdl", "Libffi_jll", "Pkg", "XML2_jll"] git-tree-sha1 = "dc643a9b774da1c2781413fd7b6dcd2c56bb8056" uuid = "a2964d1f-97da-50d4-b82a-358c7fce9d89" version = "1.17.0+4" [[Wayland_protocols_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Wayland_jll"] git-tree-sha1 = "2839f1c1296940218e35df0bbb220f2a79686670" uuid = "2381bf8a-dfd0-557d-9999-79630e7b1b91" version = "1.18.0+4" [[Widgets]] deps = ["Colors", "Dates", "Observables", "OrderedCollections"] git-tree-sha1 = "fc0feda91b3fef7fe6948ee09bb628f882b49ca4" uuid = "cc8bc4a8-27d6-5769-a93b-9d913e69aa62" version = "0.6.2" [[WoodburyMatrices]] deps = ["LinearAlgebra", "SparseArrays"] git-tree-sha1 = "59e2ad8fd1591ea019a5259bd012d7aee15f995c" uuid = "efce3f68-66dc-5838-9240-27a6d6f5f9b6" version = "0.5.3" [[XML2_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Libiconv_jll", "Pkg", "Zlib_jll"] git-tree-sha1 = "be0db24f70aae7e2b89f2f3092e93b8606d659a6" uuid = "02c8fc9c-b97f-50b9-bbe4-9be30ff0a78a" version = "2.9.10+3" [[XSLT_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Libgcrypt_jll", "Pkg", "XML2_jll"] git-tree-sha1 = "2b3eac39df218762d2d005702d601cd44c997497" uuid = "aed1982a-8fda-507f-9586-7b0439959a61" version = "1.1.33+4" [[Xorg_libX11_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", 
"Xorg_libxcb_jll", "Xorg_xtrans_jll"] git-tree-sha1 = "5be649d550f3f4b95308bf0183b82e2582876527" uuid = "4f6342f7-b3d2-589e-9d20-edeb45f2b2bc" version = "1.6.9+4" [[Xorg_libXau_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "4e490d5c960c314f33885790ed410ff3a94ce67e" uuid = "0c0b7dd1-d40b-584c-a123-a41640f87eec" version = "1.0.9+4" [[Xorg_libXcursor_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_libXfixes_jll", "Xorg_libXrender_jll"] git-tree-sha1 = "12e0eb3bc634fa2080c1c37fccf56f7c22989afd" uuid = "935fb764-8cf2-53bf-bb30-45bb1f8bf724" version = "1.2.0+4" [[Xorg_libXdmcp_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "4fe47bd2247248125c428978740e18a681372dd4" uuid = "a3789734-cfe1-5b06-b2d0-1dd0d9d62d05" version = "1.1.3+4" [[Xorg_libXext_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_libX11_jll"] git-tree-sha1 = "b7c0aa8c376b31e4852b360222848637f481f8c3" uuid = "1082639a-0dae-5f34-9b06-72781eeb8cb3" version = "1.3.4+4" [[Xorg_libXfixes_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_libX11_jll"] git-tree-sha1 = "0e0dc7431e7a0587559f9294aeec269471c991a4" uuid = "d091e8ba-531a-589c-9de9-94069b037ed8" version = "5.0.3+4" [[Xorg_libXi_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_libXext_jll", "Xorg_libXfixes_jll"] git-tree-sha1 = "89b52bc2160aadc84d707093930ef0bffa641246" uuid = "a51aa0fd-4e3c-5386-b890-e753decda492" version = "1.7.10+4" [[Xorg_libXinerama_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_libXext_jll"] git-tree-sha1 = "26be8b1c342929259317d8b9f7b53bf2bb73b123" uuid = "d1454406-59df-5ea1-beac-c340f2130bc3" version = "1.1.4+4" [[Xorg_libXrandr_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_libXext_jll", "Xorg_libXrender_jll"] git-tree-sha1 = "34cea83cb726fb58f325887bf0612c6b3fb17631" uuid = "ec84b674-ba8e-5d96-8ba1-2a689ba10484" version = "1.5.2+4" [[Xorg_libXrender_jll]] deps = ["Artifacts", 
"JLLWrappers", "Libdl", "Pkg", "Xorg_libX11_jll"] git-tree-sha1 = "19560f30fd49f4d4efbe7002a1037f8c43d43b96" uuid = "ea2f1a96-1ddc-540d-b46f-429655e07cfa" version = "0.9.10+4" [[Xorg_libpthread_stubs_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "6783737e45d3c59a4a4c4091f5f88cdcf0908cbb" uuid = "14d82f49-176c-5ed1-bb49-ad3f5cbd8c74" version = "0.1.0+3" [[Xorg_libxcb_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "XSLT_jll", "Xorg_libXau_jll", "Xorg_libXdmcp_jll", "Xorg_libpthread_stubs_jll"] git-tree-sha1 = "daf17f441228e7a3833846cd048892861cff16d6" uuid = "c7cfdc94-dc32-55de-ac96-5a1b8d977c5b" version = "1.13.0+3" [[Xorg_libxkbfile_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_libX11_jll"] git-tree-sha1 = "926af861744212db0eb001d9e40b5d16292080b2" uuid = "cc61e674-0454-545c-8b26-ed2c68acab7a" version = "1.1.0+4" [[Xorg_xcb_util_image_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_xcb_util_jll"] git-tree-sha1 = "0fab0a40349ba1cba2c1da699243396ff8e94b97" uuid = "12413925-8142-5f55-bb0e-6d7ca50bb09b" version = "0.4.0+1" [[Xorg_xcb_util_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_libxcb_jll"] git-tree-sha1 = "e7fd7b2881fa2eaa72717420894d3938177862d1" uuid = "2def613f-5ad1-5310-b15b-b15d46f528f5" version = "0.4.0+1" [[Xorg_xcb_util_keysyms_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_xcb_util_jll"] git-tree-sha1 = "d1151e2c45a544f32441a567d1690e701ec89b00" uuid = "975044d2-76e6-5fbe-bf08-97ce7c6574c7" version = "0.4.0+1" [[Xorg_xcb_util_renderutil_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_xcb_util_jll"] git-tree-sha1 = "dfd7a8f38d4613b6a575253b3174dd991ca6183e" uuid = "0d47668e-0667-5a69-a72c-f761630bfb7e" version = "0.3.9+1" [[Xorg_xcb_util_wm_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_xcb_util_jll"] git-tree-sha1 = "e78d10aab01a4a154142c5006ed44fd9e8e31b67" uuid = "c22f9ab0-d5fe-5066-847c-f4bb1cd4e361" version = 
"0.4.1+1" [[Xorg_xkbcomp_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_libxkbfile_jll"] git-tree-sha1 = "4bcbf660f6c2e714f87e960a171b119d06ee163b" uuid = "35661453-b289-5fab-8a00-3d9160c6a3a4" version = "1.4.2+4" [[Xorg_xkeyboard_config_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Xorg_xkbcomp_jll"] git-tree-sha1 = "5c8424f8a67c3f2209646d4425f3d415fee5931d" uuid = "33bec58e-1273-512f-9401-5d533626f822" version = "2.27.0+4" [[Xorg_xtrans_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "79c31e7844f6ecf779705fbc12146eb190b7d845" uuid = "c5fb5394-a638-5e4d-96e5-b29de1b5cf10" version = "1.4.0+3" [[Zlib_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "320228915c8debb12cb434c59057290f0834dbf6" uuid = "83775a58-1f1d-513f-b197-d71354ab007a" version = "1.2.11+18" [[Zstd_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "6f1abcb0c44f184690912aa4b0ba861dd64f11b9" uuid = "3161d3a3-bdf6-5164-811a-617609db77b4" version = "1.4.5+2" [[ZygoteRules]] deps = ["MacroTools"] git-tree-sha1 = "9e7a1e8ca60b742e508a315c17eef5211e7fbfd7" uuid = "700de1a5-db45-46bc-99cf-38207098b444" version = "0.2.1" [[libass_jll]] deps = ["Artifacts", "Bzip2_jll", "FreeType2_jll", "FriBidi_jll", "JLLWrappers", "Libdl", "Pkg", "Zlib_jll"] git-tree-sha1 = "acc685bcf777b2202a904cdcb49ad34c2fa1880c" uuid = "0ac62f75-1d6f-5e53-bd7c-93b484bb37c0" version = "0.14.0+4" [[libfdk_aac_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "7a5780a0d9c6864184b3a2eeeb833a0c871f00ab" uuid = "f638f0a6-7fb0-5443-88ba-1cc74229b280" version = "0.1.6+4" [[libpng_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Zlib_jll"] git-tree-sha1 = "6abbc424248097d69c0c87ba50fcb0753f93e0ee" uuid = "b53b4c65-9356-5827-b1ea-8c7a1a84506f" version = "1.6.37+6" [[libvorbis_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Ogg_jll", "Pkg"] git-tree-sha1 = "fa14ac25af7a4b8a7f61b287a124df7aab601bcd" uuid = 
"f27f6e37-5d2b-51aa-960f-b287f2bc3b7a" version = "1.3.6+6" [[x264_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "d713c1ce4deac133e3334ee12f4adff07f81778f" uuid = "1270edf5-f2f9-52d2-97e9-ab00b5d0237a" version = "2020.7.14+2" [[x265_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "487da2f8f2f0c8ee0e83f39d13037d6bbf0a45ab" uuid = "dfaa095f-4041-5dcd-9319-2fabd8486b76" version = "3.0.0+3" [[xkbcommon_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Wayland_jll", "Wayland_protocols_jll", "Xorg_libxcb_jll", "Xorg_xkeyboard_config_jll"] git-tree-sha1 = "ece2350174195bb31de1a63bea3a41ae1aa593b6" uuid = "d8fb68d0-12a3-5cfd-a85a-d49703b185fd" version = "0.9.1+5" ```

Expected behavior

All tests should pass.

Version info

Details on Julia:

Julia Version 1.5.2
Commit 539f3ce943 (2020-09-23 23:17 UTC)
Platform Info:
  OS: Linux (x86_64-pc-linux-gnu)
  CPU: Intel(R) Xeon(R) CPU E5-2667 v4 @ 3.20GHz
  WORD_SIZE: 64
  LIBM: libopenlibm
  LLVM: libLLVM-9.0.1 (ORCJIT, broadwell)
Environment:
  JULIA_NUM_THREADS = 16

Details on CUDA:

julia> CUDA.versioninfo()
CUDA toolkit 11.1.1, artifact installation
CUDA driver 11.1.0
NVIDIA driver 455.38.0

Libraries: 
- CUBLAS: 11.3.0
- CURAND: 10.2.2
- CUFFT: 10.3.0
- CUSOLVER: 11.0.1
- CUSPARSE: 11.3.0
- CUPTI: 14.0.0
- NVML: 11.0.0+455.38
- CUDNN: 8.0.4 (for CUDA 11.1.0)
- CUTENSOR: 1.2.1 (for CUDA 11.1.0)

Toolchain:
- Julia: 1.5.2
- LLVM: 9.0.1
- PTX ISA support: 3.2, 4.0, 4.1, 4.2, 4.3, 5.0, 6.0, 6.1, 6.3, 6.4
- Device support: sm_35, sm_37, sm_50, sm_52, sm_53, sm_60, sm_61, sm_62, sm_70, sm_72, sm_75

1 device:
  0: GeForce GTX 980 Ti (sm_52, 5.016 GiB / 5.940 GiB available)

Output (after installing CUDA via artifacts and running `Pkg.test("CUDA")`):

┌ Info: System information:
│ CUDA toolkit 11.1.1, artifact installation
│ CUDA driver 11.1.0
│ NVIDIA driver 455.38.0
│ 
│ Libraries: 
│ - CUBLAS: 11.3.0
│ - CURAND: 10.2.2
│ - CUFFT: 10.3.0
│ - CUSOLVER: 11.0.1
│ - CUSPARSE: 11.3.0
│ - CUPTI: 14.0.0
│ - NVML: 11.0.0+455.38
│ - CUDNN: 8.0.4 (for CUDA 11.1.0)
│ - CUTENSOR: 1.2.1 (for CUDA 11.1.0)
│ 
│ Toolchain:
│ - Julia: 1.5.2
│ - LLVM: 9.0.1
│ - PTX ISA support: 3.2, 4.0, 4.1, 4.2, 4.3, 5.0, 6.0, 6.1, 6.3, 6.4
│ - Device support: sm_35, sm_37, sm_50, sm_52, sm_53, sm_60, sm_61, sm_62, sm_70, sm_72, sm_75
│ 
│ 1 device:
└   0: GeForce GTX 980 Ti (sm_52, 4.912 GiB / 5.940 GiB available)
[ Info: Testing using 1 device(s): 1. GeForce GTX 980 Ti (UUID c4919b03-3ef2-6a21-a01c-ec04fc91cc3b)
[ Info: Skipping the following tests: cutensor/base, cutensor/contractions, cutensor/elementwise_binary, cutensor/elementwise_trinary, cutensor/permutations, cutensor/reductions, device/wmma
                                          |          | ---------------- GPU ---------------- | ---------------- CPU ---------------- |
Test                             (Worker) | Time (s) | GC (s) | GC % | Alloc (MB) | RSS (MB) | GC (s) | GC % | Alloc (MB) | RSS (MB) |
initialization                        (2) |     5.17 |   0.00 |  0.0 |       0.00 |    89.63 |   0.18 |  3.5 |     480.51 |  1422.18 |
curand                               (10) |     1.54 |   0.00 |  0.0 |       0.00 |    93.63 |   0.14 |  9.1 |     329.07 |  1422.41 |
apiutils                              (3) |     1.53 |   0.00 |  0.0 |       0.00 |    89.63 |   0.12 |  7.8 |     307.81 |  1422.18 |
nvml                                 (10) |     0.55 |   0.00 |  0.0 |       0.00 |    89.63 |   0.03 |  4.7 |      41.83 |  1422.41 |
nvtx                                  (3) |     0.51 |   0.00 |  0.0 |       0.00 |    89.63 |   0.03 |  6.7 |      63.21 |  1422.18 |
pointer                              (10) |     0.79 |   0.02 |  3.0 |       0.00 |    90.63 |   0.00 |  0.0 |      15.77 |  1422.41 |
iterator                             (17) |     4.65 |   0.12 |  2.6 |       1.07 |    90.63 |   0.22 |  4.6 |     561.80 |  1422.41 |
pool                                  (3) |     3.10 |   0.05 |  1.5 |       0.00 |    89.63 |   0.29 |  9.4 |     183.50 |  1422.18 |
codegen                               (6) |    15.94 |   0.02 |  0.1 |       0.00 |   104.75 |   0.77 |  4.9 |    1335.04 |  1422.18 |
threading                             (6) |     4.05 |   0.05 |  1.2 |      18.94 |   191.75 |   0.16 |  4.0 |     461.10 |  1636.42 |
nnlib                                 (2) |    19.43 |   0.05 |  0.2 |       4.00 |   166.75 |   0.77 |  4.0 |    1844.31 |  1493.20 |
cudadrv/context                       (2) |     0.49 |   0.00 |  0.0 |       0.00 |    89.63 |   0.00 |  0.0 |      16.45 |  1522.80 |
cudadrv/devices                       (2) |     0.36 |   0.00 |  0.0 |       0.00 |    89.63 |   0.01 |  3.5 |      36.71 |  1522.80 |
utils                                 (6) |     1.40 |   0.00 |  0.0 |       4.00 |   169.63 |   0.03 |  2.1 |     112.97 |  1644.32 |
random                               (10) |    19.11 |   0.05 |  0.3 |       0.02 |    98.75 |   0.82 |  4.3 |    1793.64 |  1422.41 |
cudadrv/events                        (6) |     0.15 |   0.00 |  0.0 |       0.00 |    97.63 |   0.01 |  8.1 |       8.13 |  1644.32 |
cudadrv/errors                        (2) |     0.30 |   0.00 |  0.0 |       0.00 |    89.63 |   0.02 |  6.0 |      17.54 |  1522.80 |
cudadrv/module                        (2) |     0.52 |   0.00 |  0.0 |       0.00 |    89.63 |   0.04 |  7.1 |      43.71 |  1522.80 |
cudadrv/execution                    (10) |     0.98 |   0.00 |  0.0 |       0.00 |    90.63 |   0.02 |  2.4 |      87.16 |  1422.41 |
cudadrv/occupancy                     (2) |     0.15 |   0.00 |  0.0 |       0.00 |    89.63 |   0.00 |  0.0 |       6.69 |  1522.80 |
cudadrv/profile                      (10) |     0.29 |   0.00 |  0.0 |       0.00 |    89.63 |   0.01 |  4.4 |      41.75 |  1422.41 |
cudadrv/stream                        (2) |     0.20 |   0.00 |  0.0 |       0.00 |    89.63 |   0.00 |  0.0 |      14.26 |  1522.80 |
cudadrv/version                      (10) |     0.01 |   0.00 |  0.0 |       0.00 |    89.63 |   0.00 |  0.0 |       0.07 |  1422.41 |
cudadrv/memory                        (6) |     2.10 |   0.00 |  0.0 |       0.00 |    98.63 |   0.07 |  3.2 |     179.54 |  1644.32 |
device/array                         (10) |     3.03 |   0.00 |  0.0 |       0.00 |    96.75 |   0.10 |  3.2 |     315.61 |  1422.41 |
statistics                           (17) |    25.80 |   0.00 |  0.0 |       0.00 |    96.75 |   1.13 |  4.4 |    2508.49 |  1422.41 |
gpuarrays/math                       (17) |     3.61 |   0.00 |  0.0 |       0.00 |    96.75 |   0.17 |  4.8 |     480.80 |  1422.41 |
device/ldg                           (10) |     6.70 |   0.00 |  0.0 |       0.00 |    96.75 |   0.21 |  3.1 |     783.77 |  1422.41 |
broadcast                             (5) |    37.58 |   0.07 |  0.2 |       0.00 |    96.75 |   1.13 |  3.0 |    3417.20 |  1422.18 |
gpuarrays/input output               (10) |     2.81 |   0.00 |  0.0 |       0.00 |    90.63 |   0.20 |  7.1 |     418.02 |  1422.41 |
gpuarrays/indexing scalar            (17) |     7.32 |   0.00 |  0.0 |       0.00 |    96.75 |   0.28 |  3.8 |     824.72 |  1422.41 |
cufft                                 (9) |    42.89 |   0.08 |  0.2 |     155.26 |   235.75 |   1.64 |  3.8 |    4141.28 |  1560.88 |
gpuarrays/interface                  (17) |     2.75 |   0.00 |  0.0 |       0.00 |    96.75 |   0.13 |  4.6 |     363.09 |  1422.41 |
cusolver/cusparse                     (2) |    22.16 |   0.00 |  0.0 |       0.19 |   259.75 |   1.25 |  5.6 |    2203.64 |  1956.57 |
gpuarrays/value constructors          (5) |    10.36 |   0.00 |  0.0 |       0.00 |    96.75 |   0.45 |  4.3 |    1342.23 |  1422.18 |
gpuarrays/iterator constructors       (9) |     5.73 |   0.00 |  0.0 |       0.02 |    96.75 |   0.23 |  4.0 |     668.61 |  1564.65 |
execution                            (15) |    49.64 |   0.05 |  0.1 |       0.02 |   158.50 |   1.73 |  3.5 |    5222.04 |  1422.41 |
gpuarrays/constructors                (9) |     1.59 |   0.00 |  0.2 |       0.03 |    90.63 |   0.03 |  2.1 |      99.81 |  1564.65 |
gpuarrays/conversions                 (5) |     4.14 |   0.00 |  0.0 |       0.01 |    90.63 |   0.13 |  3.2 |     438.49 |  1422.18 |
gpuarrays/uniformscaling             (17) |     7.93 |   0.00 |  0.0 |       0.01 |    96.75 |   0.28 |  3.6 |     794.75 |  1422.41 |
gpuarrays/indexing multidimensional  (10) |    22.74 |   0.00 |  0.0 |       0.69 |    96.75 |   1.15 |  5.1 |    2589.09 |  1422.41 |
cusparse                             (12) |    67.02 |   0.08 |  0.1 |       9.71 |   219.75 |   2.52 |  3.8 |    6237.53 |  1743.37 |
texture                               (3) |    63.22 |   0.00 |  0.0 |       0.09 |    98.75 |   2.96 |  4.7 |    6827.76 |  1422.18 |
gpuarrays/base                        (9) |    19.08 |   0.00 |  0.0 |      17.44 |   128.75 |   1.18 |  6.2 |    2443.49 |  1620.52 |
gpuarrays/random                     (15) |    20.16 |   0.00 |  0.0 |       0.03 |   106.75 |   0.64 |  3.2 |    1956.95 |  1477.34 |
array                                 (4) |    71.47 |   0.07 |  0.1 |       5.20 |   104.75 |   2.90 |  4.1 |    7746.65 |  1436.29 |
cudnn                                 (8) |    74.40 |   0.07 |  0.1 |       0.89 |   218.75 |   2.67 |  3.6 |    7394.19 |  1837.51 |
forwarddiff                          (16) |    87.19 |   0.07 |  0.1 |       0.00 |    96.75 |   1.98 |  2.3 |    5060.42 |  1422.41 |
cusolver                             (11) |    88.64 |   0.14 |  0.2 |    1298.29 |   321.75 |   3.63 |  4.1 |    8969.10 |  2017.83 |
exceptions                           (14) |    99.46 |   0.00 |  0.0 |       0.00 |    89.63 |   0.21 |  0.2 |     491.65 |  1422.41 |
cublas                                (7) |         failed at 2020-12-26T13:09:30.626
gpuarrays/broadcasting               (17) |    68.76 |   0.00 |  0.0 |       1.19 |    97.75 |   3.15 |  4.6 |    8410.12 |  1526.72 |
gpuarrays/linear algebra              (2) |    76.54 |   0.01 |  0.0 |       5.24 |   169.75 |   2.52 |  3.3 |    7122.20 |  1956.57 |
device/intrinsics                     (6) |    98.50 |   0.00 |  0.0 |       0.01 |   491.50 |   2.79 |  2.8 |    9007.35 |  1682.77 |
examples                             (13) |   132.55 |   0.00 |  0.0 |       0.00 |    89.63 |   0.25 |  0.2 |     485.51 |  1422.41 |
gpuarrays/mapreduce essentials        (5) |   111.48 |   0.01 |  0.0 |       3.19 |    98.75 |   5.16 |  4.6 |   13744.60 |  1552.70 |
gpuarrays/mapreduce derivatives      (10) |   191.23 |   0.01 |  0.0 |       3.06 |   100.75 |   8.29 |  4.3 |   19189.68 |  1918.55 |
Worker 7 failed running test cublas:
Some tests did not pass: 1908 passed, 0 failed, 1 errored, 0 broken.
cublas: Error During Test at /home/me/.julia/packages/CUDA/YeS8q/test/cublas.jl:1250
  Got exception outside of a @test
  CUBLASError: an absent device architectural feature is required (code 8, CUBLAS_STATUS_ARCH_MISMATCH)
  Stacktrace:
   [1] throw_api_error(::CUDA.CUBLAS.cublasStatus_t) at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/error.jl:47
   [2] macro expansion at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/error.jl:58 [inlined]
   [3] cublasGemmEx(::Ptr{Nothing}, ::Char, ::Char, ::Int64, ::Int64, ::Int64, ::Base.RefValue{Float16}, ::CuArray{Float16,2}, ::Type{T} where T, ::Int64, ::CuArray{Float16,2}, ::Type{T} where T, ::Int64, ::Base.RefValue{Float16}, ::CuArray{Float16,2}, ::Type{T} where T, ::Int64, ::CUDA.CUBLAS.cublasComputeType_t, ::CUDA.CUBLAS.cublasGemmAlgo_t) at /home/me/.julia/packages/CUDA/YeS8q/lib/utils/call.jl:93
   [4] gemmEx!(::Char, ::Char, ::Number, ::Union{CuArray{T,1}, CuArray{T,2}} where T, ::Union{CuArray{T,1}, CuArray{T,2}} where T, ::Number, ::Union{CuArray{T,1}, CuArray{T,2}} where T; algo::CUDA.CUBLAS.cublasGemmAlgo_t) at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/wrappers.jl:836
   [5] gemmEx! at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/wrappers.jl:818 [inlined]
   [6] gemm_dispatch!(::CuArray{Float16,2}, ::CuArray{Float16,2}, ::CuArray{Float16,2}, ::Bool, ::Bool) at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/linalg.jl:216
   [7] mul! at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/linalg.jl:227 [inlined]
   [8] mul!(::CuArray{Float16,2}, ::CuArray{Float16,2}, ::CuArray{Float16,2}) at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/LinearAlgebra/src/matmul.jl:208
   [9] top-level scope at /home/me/.julia/packages/CUDA/YeS8q/test/cublas.jl:1275
   [10] top-level scope at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Test/src/Test.jl:1115
   [11] top-level scope at /home/me/.julia/packages/CUDA/YeS8q/test/cublas.jl:1251
   [12] top-level scope at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Test/src/Test.jl:1115
   [13] top-level scope at /home/me/.julia/packages/CUDA/YeS8q/test/cublas.jl:438
   [14] include(::String) at ./client.jl:457
   [15] #9 at /home/me/.julia/packages/CUDA/YeS8q/test/runtests.jl:78 [inlined]
   [16] macro expansion at /home/me/.julia/packages/CUDA/YeS8q/test/setup.jl:47 [inlined]
   [17] macro expansion at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Test/src/Test.jl:1115 [inlined]
   [18] macro expansion at /home/me/.julia/packages/CUDA/YeS8q/test/setup.jl:47 [inlined]
   [19] macro expansion at /home/me/.julia/packages/CUDA/YeS8q/src/utilities.jl:35 [inlined]
   [20] macro expansion at /home/me/.julia/packages/CUDA/YeS8q/src/pool.jl:564 [inlined]
   [21] top-level scope at /home/me/.julia/packages/CUDA/YeS8q/test/setup.jl:46
   [22] eval at ./boot.jl:331 [inlined]
   [23] runtests(::Function, ::String, ::Symbol, ::Nothing) at /home/me/.julia/packages/CUDA/YeS8q/test/setup.jl:58
   [24] (::Distributed.var"#106#108"{Distributed.CallMsg{:call_fetch}})() at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Distributed/src/process_messages.jl:294
   [25] run_work_thunk(::Distributed.var"#106#108"{Distributed.CallMsg{:call_fetch}}, ::Bool) at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Distributed/src/process_messages.jl:79
   [26] macro expansion at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Distributed/src/process_messages.jl:294 [inlined]
   [27] (::Distributed.var"#105#107"{Distributed.CallMsg{:call_fetch},Distributed.MsgHeader,Sockets.TCPSocket})() at ./task.jl:356

Test Summary:                         | Pass  Error  Broken  Total
  Overall                             | 8453      1       5   8459
    initialization                    |   25                    25
    curand                            |    1                     1
    apiutils                          |   15                    15
    nvml                              |    7                     7
    nvtx                              |                      No tests
    pointer                           |   35                    35
    iterator                          |   30                    30
    pool                              |   10                    10
    codegen                           |    9                     9
    threading                         |                      No tests
    nnlib                             |   17                    17
    cudadrv/context                   |   12                    12
    cudadrv/devices                   |    6                     6
    utils                             |    5                     5
    random                            |  101                   101
    cudadrv/events                    |    6                     6
    cudadrv/errors                    |    6                     6
    cudadrv/module                    |   12                    12
    cudadrv/execution                 |   15                    15
    cudadrv/occupancy                 |    1                     1
    cudadrv/profile                   |    2                     2
    cudadrv/stream                    |    7                     7
    cudadrv/version                   |    3                     3
    cudadrv/memory                    |   49              1     50
    device/array                      |   18                    18
    statistics                        |   18                    18
    gpuarrays/math                    |    8                     8
    device/ldg                        |   22                    22
    broadcast                         |   29                    29
    gpuarrays/input output            |    5                     5
    gpuarrays/indexing scalar         |  249                   249
    cufft                             |  175                   175
    gpuarrays/interface               |    7                     7
    cusolver/cusparse                 |   84                    84
    gpuarrays/value constructors      |   36                    36
    gpuarrays/iterator constructors   |   24                    24
    execution                         |   65                    65
    gpuarrays/constructors            |  335                   335
    gpuarrays/conversions             |   72                    72
    gpuarrays/uniformscaling          |   56                    56
    gpuarrays/indexing multidimensional |   34                    34
    cusparse                          |  630                   630
    texture                           |   38              4     42
    gpuarrays/base                    |   39                    39
    gpuarrays/random                  |   46                    46
    array                             |  180                   180
    cudnn                             |  147                   147
    forwarddiff                       |  107                   107
    cusolver                          | 1580                  1580
    exceptions                        |   17                    17
    cublas                            | 1908      1           1909
    gpuarrays/broadcasting            |  155                   155
    gpuarrays/linear algebra          |  389                   389
    device/intrinsics                 |  250                   250
    examples                          |    7                     7
    gpuarrays/mapreduce essentials    |  522                   522
    gpuarrays/mapreduce derivatives   |  827                   827
    FAILURE

Error in testset cublas:
Error During Test at /home/me/.julia/packages/CUDA/YeS8q/test/cublas.jl:1250
  Got exception outside of a @test
  CUBLASError: an absent device architectural feature is required (code 8, CUBLAS_STATUS_ARCH_MISMATCH)
  Stacktrace:
   [1] throw_api_error(::CUDA.CUBLAS.cublasStatus_t) at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/error.jl:47
   [2] macro expansion at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/error.jl:58 [inlined]
   [3] cublasGemmEx(::Ptr{Nothing}, ::Char, ::Char, ::Int64, ::Int64, ::Int64, ::Base.RefValue{Float16}, ::CuArray{Float16,2}, ::Type{T} where T, ::Int64, ::CuArray{Float16,2}, ::Type{T} where T, ::Int64, ::Base.RefValue{Float16}, ::CuArray{Float16,2}, ::Type{T} where T, ::Int64, ::CUDA.CUBLAS.cublasComputeType_t, ::CUDA.CUBLAS.cublasGemmAlgo_t) at /home/me/.julia/packages/CUDA/YeS8q/lib/utils/call.jl:93
   [4] gemmEx!(::Char, ::Char, ::Number, ::Union{CuArray{T,1}, CuArray{T,2}} where T, ::Union{CuArray{T,1}, CuArray{T,2}} where T, ::Number, ::Union{CuArray{T,1}, CuArray{T,2}} where T; algo::CUDA.CUBLAS.cublasGemmAlgo_t) at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/wrappers.jl:836
   [5] gemmEx! at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/wrappers.jl:818 [inlined]
   [6] gemm_dispatch!(::CuArray{Float16,2}, ::CuArray{Float16,2}, ::CuArray{Float16,2}, ::Bool, ::Bool) at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/linalg.jl:216
   [7] mul! at /home/me/.julia/packages/CUDA/YeS8q/lib/cublas/linalg.jl:227 [inlined]
   [8] mul!(::CuArray{Float16,2}, ::CuArray{Float16,2}, ::CuArray{Float16,2}) at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/LinearAlgebra/src/matmul.jl:208
   [9] top-level scope at /home/me/.julia/packages/CUDA/YeS8q/test/cublas.jl:1275
   [10] top-level scope at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Test/src/Test.jl:1115
   [11] top-level scope at /home/me/.julia/packages/CUDA/YeS8q/test/cublas.jl:1251
   [12] top-level scope at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Test/src/Test.jl:1115
   [13] top-level scope at /home/me/.julia/packages/CUDA/YeS8q/test/cublas.jl:438
   [14] include(::String) at ./client.jl:457
   [15] #9 at /home/me/.julia/packages/CUDA/YeS8q/test/runtests.jl:78 [inlined]
   [16] macro expansion at /home/me/.julia/packages/CUDA/YeS8q/test/setup.jl:47 [inlined]
   [17] macro expansion at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Test/src/Test.jl:1115 [inlined]
   [18] macro expansion at /home/me/.julia/packages/CUDA/YeS8q/test/setup.jl:47 [inlined]
   [19] macro expansion at /home/me/.julia/packages/CUDA/YeS8q/src/utilities.jl:35 [inlined]
   [20] macro expansion at /home/me/.julia/packages/CUDA/YeS8q/src/pool.jl:564 [inlined]
   [21] top-level scope at /home/me/.julia/packages/CUDA/YeS8q/test/setup.jl:46
   [22] eval at ./boot.jl:331 [inlined]
   [23] runtests(::Function, ::String, ::Symbol, ::Nothing) at /home/me/.julia/packages/CUDA/YeS8q/test/setup.jl:58
   [24] (::Distributed.var"#106#108"{Distributed.CallMsg{:call_fetch}})() at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Distributed/src/process_messages.jl:294
   [25] run_work_thunk(::Distributed.var"#106#108"{Distributed.CallMsg{:call_fetch}}, ::Bool) at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Distributed/src/process_messages.jl:79
   [26] macro expansion at /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.5/Distributed/src/process_messages.jl:294 [inlined]
   [27] (::Distributed.var"#105#107"{Distributed.CallMsg{:call_fetch},Distributed.MsgHeader,Sockets.TCPSocket})() at ./task.jl:356

ERROR: LoadError: Test run finished with errors
in expression starting at /home/me/.julia/packages/CUDA/YeS8q/test/runtests.jl:483
maleadt commented 3 years ago

Can you run the CUBLAS tests with JULIA_DEBUG=CUBLAS? For example, using:

$ JULIA_DEBUG=CUBLAS julia -e 'using Pkg; Pkg.test("CUDA"; test_args=`cublas`)'

This will generate a lot of output.

mkarikom commented 3 years ago

Thanks @maleadt, please see the attached outputs from the 980 Ti and the 3090. I redirected the output to a file, but after generating a lot of output the run appeared to hang, so I killed it manually.
Please let me know if anything is missing.

output980.txt output3090.txt

maleadt commented 3 years ago

Those logs don't actually contain any test results; the runs seem to have hung, as you describe. Can you try the following instead (you may have to install some of the dependencies here):

julia> ENV["JULIA_DEBUG"] = "CUBLAS"
"CUBLAS"

julia> using CUDA

julia> using LinearAlgebra, Test, BFloat16s

julia> m = 20
20

julia> n = 35
35

julia> k = 13
13

julia> Base.eps(::Type{BFloat16}) = Base.bitcast(BFloat16, 0x3c00)

julia> @testset "mixed-precision matmul" begin
           m,k,n = 4,4,4
           cudaTypes = (Float16, Complex{Float16}, BFloat16, Complex{BFloat16}, Float32, Complex{Float32},
                       Float64, Complex{Float64}, Int8, Complex{Int8}, UInt8, Complex{UInt8},
                       Int16, Complex{Int16}, UInt16, Complex{UInt16}, Int32, Complex{Int32},
                       UInt32, Complex{UInt32}, Int64, Complex{Int64}, UInt64, Complex{UInt64})

           for AT in cudaTypes, CT in cudaTypes
               BT = AT # gemmEx requires identical A and B types

               # we only test combinations of types that are supported by gemmEx
               if CUBLAS.gemmExComputeType(AT, BT, CT, m,k,n) !== nothing
                   A = AT <: BFloat16 ? AT.(rand(m,k)) : rand(AT, m,k)
                   B = BT <: BFloat16 ? BT.(rand(k,n)) : rand(BT, k,n)
                   C = similar(B, CT)
                   mul!(C, A, B)

                   # Base can't do Int8*Int8 without losing accuracy
                   if (AT == Int8 && BT == Int8) || (AT == Complex{Int8} && BT == Complex{Int8})
                       C = CT.(A) * CT.(B)
                   end

                   dA = CuArray(A)
                   dB = CuArray(B)
                   dC = similar(dB, CT)
                   mul!(dC, dA, dB)

                   rtol = Base.rtoldefault(AT, BT, 0)
                   @test C ≈ Array(dC) rtol=rtol
               end
           end
       end
mkarikom commented 3 years ago

OK, thanks. The GPU is tied up right now, but I'll try to post these in a day or so.

maleadt commented 3 years ago

And FWIW, after https://github.com/JuliaGPU/CUDA.jl/pull/649 it should now also be possible to run the entire CUBLAS test suite under JULIA_DEBUG, so you can pick either approach.

Talinx commented 3 years ago

I have the same issue. Output of the mixed-precision matmul test: gemmExTestOutput.txt

I found this forum post; maybe it is related?

Manifest.toml

``` # This file is machine-generated - editing it directly is not advised [[AbstractFFTs]] deps = ["LinearAlgebra"] git-tree-sha1 = "051c95d6836228d120f5f4b984dd5aba1624f716" uuid = "621f4979-c628-5d54-868e-fcf4e3e8185c" version = "0.5.0" [[AbstractTrees]] deps = ["Markdown"] git-tree-sha1 = "33e450545eaf7699da1a6e755f9ea65f14077a45" uuid = "1520ce14-60c1-5f80-bbc7-55ef81b5835c" version = "0.3.3" [[Adapt]] deps = ["LinearAlgebra"] git-tree-sha1 = "ffcfa2d345aaee0ef3d8346a073d5dd03c983ebe" uuid = "79e6a3ab-5dfb-504d-930d-738a2a938a0e" version = "3.2.0" [[ArrayInterface]] deps = ["IfElse", "LinearAlgebra", "Requires", "SparseArrays"] git-tree-sha1 = "ee07ae00e3cc277dcfa5507ce25be522313ecc3e" uuid = "4fba245c-0d91-5ea0-9b3e-6abc04ee57a9" version = "3.1.1" [[Artifacts]] deps = ["Pkg"] git-tree-sha1 = "c30985d8821e0cd73870b17b0ed0ce6dc44cb744" uuid = "56f22d72-fd6d-98f1-02f0-08ddc0907c33" version = "1.3.0" [[AxisAlgorithms]] deps = ["LinearAlgebra", "Random", "SparseArrays", "WoodburyMatrices"] git-tree-sha1 = "a4d07a1c313392a77042855df46c5f534076fab9" uuid = "13072b0f-2c55-5437-9ae7-d433b7a33950" version = "1.0.0" [[AxisArrays]] deps = ["Dates", "IntervalSets", "IterTools", "RangeArrays"] git-tree-sha1 = "f31f50712cbdf40ee8287f0443b57503e34122ef" uuid = "39de3d68-74b9-583c-8d2d-e117c070f3a9" version = "0.4.3" [[BFloat16s]] deps = ["LinearAlgebra", "Test"] git-tree-sha1 = "4af69e205efc343068dc8722b8dfec1ade89254a" uuid = "ab4f0b2a-ad5b-11e8-123f-65d77653426b" version = "0.1.0" [[BSON]] git-tree-sha1 = "dd36d7cf3d185eeaaf64db902c15174b22f5dafb" uuid = "fbb218c0-5317-5bc6-957e-2ee96dd4b1f0" version = "0.2.6" [[Base64]] uuid = "2a0f44e3-6c83-55bd-87e4-b1978d98bd5f" [[CEnum]] git-tree-sha1 = "215a9aa4a1f23fbd05b92769fdd62559488d70e9" uuid = "fa961155-64e5-5f13-b03f-caf6b980ea82" version = "0.4.1" [[CSV]] deps = ["Dates", "Mmap", "Parsers", "PooledArrays", "SentinelArrays", "Tables", "Unicode"] git-tree-sha1 = "1f79803452adf73e2d3fc84785adb7aaca14db36" uuid = 
"336ed68f-0bac-5ca0-87d4-7b16caf5d00b" version = "0.8.3" [[CUDA]] deps = ["AbstractFFTs", "Adapt", "BFloat16s", "CEnum", "CompilerSupportLibraries_jll", "DataStructures", "ExprTools", "GPUArrays", "GPUCompiler", "LLVM", "Libdl", "LinearAlgebra", "Logging", "MacroTools", "NNlib", "Pkg", "Printf", "Random", "Reexport", "Requires", "SparseArrays", "Statistics", "TimerOutputs"] git-tree-sha1 = "6ccc73b2d8b671f7a65c92b5f08f81422ebb7547" pinned = true uuid = "052768ef-5323-5732-b1bb-66c8b64840ba" version = "2.4.1" [[CatIndices]] deps = ["CustomUnitRanges", "OffsetArrays"] git-tree-sha1 = "a0f80a09780eed9b1d106a1bf62041c2efc995bc" uuid = "aafaddc9-749c-510e-ac4f-586e18779b91" version = "0.2.2" [[CategoricalArrays]] deps = ["DataAPI", "Future", "JSON", "Missings", "Printf", "Statistics", "StructTypes", "Unicode"] git-tree-sha1 = "99809999c8ee01fa89498480b147f7394ea5450f" uuid = "324d7699-5711-5eae-9e2f-1d82baa6b597" version = "0.9.2" [[ChainRules]] deps = ["ChainRulesCore", "Compat", "LinearAlgebra", "Random", "Reexport", "Requires", "Statistics"] git-tree-sha1 = "56bbb956a573ac16b277008edb1762ef80076e78" uuid = "082447d4-558c-5d27-93f4-14fc19e9eca2" version = "0.7.50" [[ChainRulesCore]] deps = ["Compat", "LinearAlgebra", "SparseArrays"] git-tree-sha1 = "d3d0a4e0d5bc03a6c97f4d249c8a471fc20a2f33" uuid = "d360d2e6-b24c-11e9-a2a3-2a2ae2dbcce4" version = "0.9.28" [[CodecZlib]] deps = ["TranscodingStreams", "Zlib_jll"] git-tree-sha1 = "ded953804d019afa9a3f98981d99b33e3db7b6da" uuid = "944b1d66-785c-5afd-91f1-9de20f533193" version = "0.7.0" [[ColorTypes]] deps = ["FixedPointNumbers", "Random"] git-tree-sha1 = "4bffea7ed1a9f0f3d1a131bbcd4b925548d75288" uuid = "3da002f7-5984-5a60-b8a6-cbb66c0b333f" version = "0.10.9" [[ColorVectorSpace]] deps = ["ColorTypes", "Colors", "FixedPointNumbers", "LinearAlgebra", "SpecialFunctions", "Statistics", "StatsBase"] git-tree-sha1 = "4d17724e99f357bfd32afa0a9e2dda2af31a9aea" uuid = "c3611d14-8923-5661-9e6a-0046d554d3a4" version = "0.8.7" 
[[Colors]] deps = ["ColorTypes", "FixedPointNumbers", "InteractiveUtils", "Reexport"] git-tree-sha1 = "ac5f2213e56ed8a34a3dd2f681f4df1166b34929" uuid = "5ae59095-9a9b-59fe-a467-6f913c188581" version = "0.12.6" [[CommonSubexpressions]] deps = ["MacroTools", "Test"] git-tree-sha1 = "7b8a93dba8af7e3b42fecabf646260105ac373f7" uuid = "bbf7d656-a473-5ed7-a52c-81e309532950" version = "0.3.0" [[Compat]] deps = ["Base64", "Dates", "DelimitedFiles", "Distributed", "InteractiveUtils", "LibGit2", "Libdl", "LinearAlgebra", "Markdown", "Mmap", "Pkg", "Printf", "REPL", "Random", "SHA", "Serialization", "SharedArrays", "Sockets", "SparseArrays", "Statistics", "Test", "UUIDs", "Unicode"] git-tree-sha1 = "919c7f3151e79ff196add81d7f4e45d91bbf420b" uuid = "34da2185-b29b-5c13-b0c7-acf172513d20" version = "3.25.0" [[CompilerSupportLibraries_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "8e695f735fca77e9708e795eda62afdb869cbb70" uuid = "e66e0078-7015-5450-92f7-15fbd957f2ae" version = "0.3.4+0" [[ComputationalResources]] git-tree-sha1 = "52cb3ec90e8a8bea0e62e275ba577ad0f74821f7" uuid = "ed09eef8-17a6-5b46-8889-db040fac31e3" version = "0.3.2" [[CoordinateTransformations]] deps = ["LinearAlgebra", "StaticArrays"] git-tree-sha1 = "6d1c23e740a586955645500bbec662476204a52c" uuid = "150eb455-5306-5404-9cee-2592286d6298" version = "0.6.1" [[Crayons]] git-tree-sha1 = "3f71217b538d7aaee0b69ab47d9b7724ca8afa0d" uuid = "a8cc5b0e-0ffa-5ad4-8c14-923d3ee1735f" version = "4.0.4" [[CustomUnitRanges]] git-tree-sha1 = "537c988076d001469093945f3bd0b300b8d3a7f3" uuid = "dc8bdbbb-1ca9-579f-8c36-e416f6a65cce" version = "1.0.1" [[DataAPI]] git-tree-sha1 = "8ab70b4de35bb3b8cc19654f6b893cf5164f8ee8" uuid = "9a962f9c-6df0-11e9-0e5d-c546b8b5ee8a" version = "1.5.1" [[DataFrames]] deps = ["CategoricalArrays", "Compat", "DataAPI", "Future", "InvertedIndices", "IteratorInterfaceExtensions", "LinearAlgebra", "Markdown", "Missings", "PooledArrays", "PrettyTables", "Printf", "REPL", "Reexport", 
"SortingAlgorithms", "Statistics", "TableTraits", "Tables", "Unicode"] git-tree-sha1 = "b0db5579803eabb33f1274ca7ca2f472fdfb7f2a" uuid = "a93c6f00-e57d-5684-b7b6-d8193f3e46c0" version = "0.22.5" [[DataStructures]] deps = ["Compat", "InteractiveUtils", "OrderedCollections"] git-tree-sha1 = "4437b64df1e0adccc3e5d1adbc3ac741095e4677" uuid = "864edb3b-99cc-5e75-8d2d-829cb0a9cfe8" version = "0.18.9" [[DataValueInterfaces]] git-tree-sha1 = "bfc1187b79289637fa0ef6d4436ebdfe6905cbd6" uuid = "e2d170a0-9d28-54be-80f0-106bbe20a464" version = "1.0.0" [[Dates]] deps = ["Printf"] uuid = "ade2ca70-3891-5945-98fb-dc099432e06a" [[DelimitedFiles]] deps = ["Mmap"] uuid = "8bb1440f-4735-579b-a4ab-409b98df4dab" [[DiffResults]] deps = ["StaticArrays"] git-tree-sha1 = "c18e98cba888c6c25d1c3b048e4b3380ca956805" uuid = "163ba53b-c6d8-5494-b064-1a9d43ac40c5" version = "1.0.3" [[DiffRules]] deps = ["NaNMath", "Random", "SpecialFunctions"] git-tree-sha1 = "214c3fcac57755cfda163d91c58893a8723f93e9" uuid = "b552c78f-8df3-52c6-915a-8e097449b14b" version = "1.0.2" [[Distances]] deps = ["LinearAlgebra", "Statistics"] git-tree-sha1 = "366715149014943abd71aa647a07a43314158b2d" uuid = "b4f34e82-e78d-54a5-968a-f98e89d6e8f7" version = "0.10.2" [[Distributed]] deps = ["Random", "Serialization", "Sockets"] uuid = "8ba89e20-285c-5b6f-9357-94700520ee1b" [[EllipsisNotation]] deps = ["ArrayInterface"] git-tree-sha1 = "8041575f021cba5a099a456b4163c9a08b566a02" uuid = "da5c29d0-fa7d-589e-88eb-ea29b0a81949" version = "1.1.0" [[ExprTools]] git-tree-sha1 = "10407a39b87f29d47ebaca8edbc75d7c302ff93e" uuid = "e2ba6199-217a-4e67-a87a-7c52f15ade04" version = "0.1.3" [[FFTViews]] deps = ["CustomUnitRanges", "FFTW"] git-tree-sha1 = "70a0cfd9b1c86b0209e38fbfe6d8231fd606eeaf" uuid = "4f61f5a4-77b1-5117-aa51-3ab5ef4ef0cd" version = "0.3.1" [[FFTW]] deps = ["AbstractFFTs", "FFTW_jll", "IntelOpenMP_jll", "Libdl", "LinearAlgebra", "MKL_jll", "Reexport"] git-tree-sha1 = "8fda0934cb99db617171f7296dc361f4d6fa5424" uuid = 
"7a1cc6ca-52ef-59f5-83cd-3a7055c09341" version = "1.3.0" [[FFTW_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "5a0d4b6a22a34d17d53543bd124f4b08ed78e8b0" uuid = "f5851436-0d7a-5f13-b9de-f02708fd171a" version = "3.3.9+7" [[FileIO]] deps = ["Pkg"] git-tree-sha1 = "fee8955b9dfa7bec67117ef48085fb2b559b9c22" uuid = "5789e2e9-d7fb-5bc7-8068-2c6fae9b9549" version = "1.4.5" [[FillArrays]] deps = ["LinearAlgebra", "Random", "SparseArrays"] git-tree-sha1 = "50eabdace27aa27b143f65b65e762bb0112a7708" uuid = "1a297f60-69ca-5386-bcde-b61e274b549b" version = "0.11.1" [[FixedPointNumbers]] deps = ["Statistics"] git-tree-sha1 = "335bfdceacc84c5cdf16aadc768aa5ddfc5383cc" uuid = "53c48c17-4a7d-5ca2-90c5-79b7896eea93" version = "0.8.4" [[Flux]] deps = ["AbstractTrees", "Adapt", "CUDA", "CodecZlib", "Colors", "DelimitedFiles", "Functors", "Juno", "LinearAlgebra", "MacroTools", "NNlib", "Pkg", "Printf", "Random", "Reexport", "SHA", "Statistics", "StatsBase", "Test", "ZipFile", "Zygote"] git-tree-sha1 = "c443bf5a8329573a68364106b2c29bb6938dc6f5" uuid = "587475ba-b771-5e3f-ad9e-33799f191a9c" version = "0.11.6" [[Formatting]] deps = ["Printf"] git-tree-sha1 = "8339d61043228fdd3eb658d86c926cb282ae72a8" uuid = "59287772-0a20-5a39-b81b-1366585eb4c0" version = "0.4.2" [[ForwardDiff]] deps = ["CommonSubexpressions", "DiffResults", "DiffRules", "NaNMath", "Random", "SpecialFunctions", "StaticArrays"] git-tree-sha1 = "d48a40c0f54f29a5c8748cfb3225719accc72b77" uuid = "f6369f11-7733-5829-9624-2563aa707210" version = "0.10.16" [[Functors]] deps = ["MacroTools"] git-tree-sha1 = "f40adc6422f548176bb4351ebd29e4abf773040a" uuid = "d9f16b24-f501-4c13-a1f2-28368ffc5196" version = "0.1.0" [[Future]] deps = ["Random"] uuid = "9fa8497b-333b-5362-9e8d-4d0656e87820" [[FuzzyCompletions]] deps = ["REPL"] git-tree-sha1 = "5ca3ddf3061771d25d1699ce53a80a39300811e3" uuid = "fb4132e2-a121-4a70-b8a1-d5b831dcdcc2" version = "0.4.0" [[GPUArrays]] deps = ["AbstractFFTs", "Adapt", 
"LinearAlgebra", "Printf", "Random", "Serialization"] git-tree-sha1 = "f99a25fe0313121f2f9627002734c7d63b4dd3bd" uuid = "0c68f7d7-f131-5f86-a1c3-88cf8149b2d7" version = "6.2.0" [[GPUCompiler]] deps = ["DataStructures", "InteractiveUtils", "LLVM", "Libdl", "Scratch", "Serialization", "TimerOutputs", "UUIDs"] git-tree-sha1 = "c853c810b52a80f9aad79ab109207889e57f41ef" uuid = "61eb1bfa-7361-4325-ad38-22787b887f55" version = "0.8.3" [[Graphics]] deps = ["Colors", "LinearAlgebra", "NaNMath"] git-tree-sha1 = "2c1cf4df419938ece72de17f368a021ee162762e" uuid = "a2bd30eb-e257-5431-a919-1863eab51364" version = "1.1.0" [[HTTP]] deps = ["Base64", "Dates", "IniFile", "MbedTLS", "Sockets", "URIs"] git-tree-sha1 = "942c1a9c750bbe79912b7bd060a420932afd35b8" uuid = "cd3eb016-35fb-5094-929b-558a96fad6f3" version = "0.9.3" [[IRTools]] deps = ["InteractiveUtils", "MacroTools", "Test"] git-tree-sha1 = "c67e7515a11f726f44083e74f218d134396d6510" uuid = "7869d1d1-7146-5819-86e3-90919afe41df" version = "0.4.2" [[IdentityRanges]] deps = ["OffsetArrays"] git-tree-sha1 = "be8fcd695c4da16a1d6d0cd213cb88090a150e3b" uuid = "bbac6d45-d8f3-5730-bfe4-7a449cd117ca" version = "0.3.1" [[IfElse]] git-tree-sha1 = "28e837ff3e7a6c3cdb252ce49fb412c8eb3caeef" uuid = "615f187c-cbe4-4ef1-ba3b-2fcf58d6d173" version = "0.1.0" [[ImageAxes]] deps = ["AxisArrays", "ImageCore", "Reexport", "SimpleTraits"] git-tree-sha1 = "1592c7fd668ac9cdcef73f704ca457ccdaac2933" uuid = "2803e5a7-5153-5ecf-9a86-9b4c37f5f5ac" version = "0.6.8" [[ImageContrastAdjustment]] deps = ["ColorVectorSpace", "ImageCore", "ImageTransformations", "Parameters"] git-tree-sha1 = "210f8fb370d4b97fa12d65322c62df06f3e5563b" uuid = "f332f351-ec65-5f6a-b3d1-319c6670881a" version = "0.3.6" [[ImageCore]] deps = ["AbstractFFTs", "Colors", "FixedPointNumbers", "Graphics", "MappedArrays", "MosaicViews", "OffsetArrays", "PaddedViews", "Reexport"] git-tree-sha1 = "79badd979fbee9b8980cd995cd5a86a9e93b8ad7" uuid = "a09fc81d-aa75-5fe9-8630-4744c3626534" version = 
"0.8.20" [[ImageDistances]] deps = ["ColorVectorSpace", "Distances", "ImageCore", "ImageMorphology", "LinearAlgebra", "Statistics"] git-tree-sha1 = "159e24b4313d9197eef900e97fbd7365986f2844" uuid = "51556ac3-7006-55f5-8cb3-34580c88182d" version = "0.2.10" [[ImageFiltering]] deps = ["CatIndices", "ColorVectorSpace", "ComputationalResources", "DataStructures", "FFTViews", "FFTW", "ImageCore", "ImageMetadata", "LinearAlgebra", "OffsetArrays", "Requires", "SparseArrays", "StaticArrays", "Statistics", "TiledIteration"] git-tree-sha1 = "f82a52fa2e684d4ed69028b16188852ff94b3f75" uuid = "6a3955dd-da59-5b1f-98d4-e7296123deb5" version = "0.6.19" [[ImageIO]] deps = ["FileIO", "Netpbm", "PNGFiles"] git-tree-sha1 = "0d6d09c28d67611c68e25af0c2df7269c82b73c7" uuid = "82e4d734-157c-48bb-816b-45c225c6df19" version = "0.4.1" [[ImageMagick]] deps = ["FileIO", "ImageCore", "ImageMagick_jll", "InteractiveUtils", "Libdl", "Pkg", "Random"] git-tree-sha1 = "02558f83932fde6ebd3ab007dbff6bd8740a8247" uuid = "6218d12a-5da1-5696-b52f-db25d2ecc6d1" version = "1.1.6" [[ImageMagick_jll]] deps = ["JpegTurbo_jll", "Libdl", "Libtiff_jll", "Pkg", "Zlib_jll", "libpng_jll"] git-tree-sha1 = "1c0a2295cca535fabaf2029062912591e9b61987" uuid = "c73af94c-d91f-53ed-93a7-00f77d67a9d7" version = "6.9.10-12+3" [[ImageMetadata]] deps = ["AxisArrays", "ColorVectorSpace", "ImageAxes", "ImageCore", "IndirectArrays"] git-tree-sha1 = "ff77c7f234e7d8a618958fcf23b6959f2cbef2c6" uuid = "bc367c6b-8a6b-528e-b4bd-a4b897500b49" version = "0.9.4" [[ImageMorphology]] deps = ["ColorVectorSpace", "ImageCore", "LinearAlgebra", "TiledIteration"] git-tree-sha1 = "113df7743f1e18da5f5ea5f98eb59ceb77092734" uuid = "787d08f9-d448-5407-9aad-5290dd7ab264" version = "0.2.9" [[ImageQualityIndexes]] deps = ["ColorVectorSpace", "ImageCore", "ImageDistances", "ImageFiltering", "OffsetArrays", "Statistics"] git-tree-sha1 = "80484f9e1beae36860ed8022f195d04c751cfec6" uuid = "2996bd0c-7a13-11e9-2da2-2f5ce47296a9" version = "0.2.1" [[ImageShow]] 
deps = ["Base64", "FileIO", "ImageCore", "Requires"] git-tree-sha1 = "c9df184bc7c2e665f971079174aabb7d18f1845f" uuid = "4e3cecfd-b093-5904-9786-8bbb286a6a31" version = "0.2.3" [[ImageTransformations]] deps = ["AxisAlgorithms", "ColorVectorSpace", "CoordinateTransformations", "IdentityRanges", "ImageCore", "Interpolations", "OffsetArrays", "Rotations", "StaticArrays"] git-tree-sha1 = "0426a62ca1a23f3b1ee75cc0e47320d859abd6ae" uuid = "02fcd773-0e25-5acc-982a-7f6622650795" version = "0.8.9" [[Images]] deps = ["AxisArrays", "Base64", "ColorVectorSpace", "FileIO", "Graphics", "ImageAxes", "ImageContrastAdjustment", "ImageCore", "ImageDistances", "ImageFiltering", "ImageMetadata", "ImageMorphology", "ImageQualityIndexes", "ImageShow", "ImageTransformations", "IndirectArrays", "OffsetArrays", "Random", "Reexport", "SparseArrays", "StaticArrays", "Statistics", "StatsBase", "TiledIteration"] git-tree-sha1 = "535bcaae047f017f4fd7331ee859b75f2b27e505" uuid = "916415d5-f1e6-5110-898d-aaa5f9f070e0" version = "0.23.3" [[IndirectArrays]] git-tree-sha1 = "c2a145a145dc03a7620af1444e0264ef907bd44f" uuid = "9b13fd28-a010-5f03-acff-a1bbcff69959" version = "0.5.1" [[IniFile]] deps = ["Test"] git-tree-sha1 = "098e4d2c533924c921f9f9847274f2ad89e018b8" uuid = "83e8ac13-25f8-5344-8a64-a9f2b223428f" version = "0.5.0" [[IntelOpenMP_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "d979e54b71da82f3a65b62553da4fc3d18c9004c" uuid = "1d5cc7b8-4909-519e-a0f8-d0f5ad9712d0" version = "2018.0.3+2" [[InteractiveUtils]] deps = ["Markdown"] uuid = "b77e0a4c-d291-57a0-90e8-8db25a27a240" [[Interpolations]] deps = ["AxisAlgorithms", "LinearAlgebra", "OffsetArrays", "Random", "Ratios", "SharedArrays", "SparseArrays", "StaticArrays", "WoodburyMatrices"] git-tree-sha1 = "eb1dd6d5b2275faaaa18533e0fc5f9171cec25fa" uuid = "a98d9a8b-a2ab-59e6-89dd-64a1c18fca59" version = "0.13.1" [[IntervalSets]] deps = ["Dates", "EllipsisNotation", "Statistics"] git-tree-sha1 = 
"93a6d78525feb0d3ee2a2ae83a7d04db1db5663f" uuid = "8197267c-284f-5f27-9208-e0e47529a953" version = "0.5.2" [[InvertedIndices]] deps = ["Test"] git-tree-sha1 = "15732c475062348b0165684ffe28e85ea8396afc" uuid = "41ab1584-1d38-5bbf-9106-f11c6c58b48f" version = "1.0.0" [[IterTools]] git-tree-sha1 = "05110a2ab1fc5f932622ffea2a003221f4782c18" uuid = "c8e1da08-722c-5040-9ed9-7db0dc04731e" version = "1.3.0" [[IteratorInterfaceExtensions]] git-tree-sha1 = "a3f24677c21f5bbe9d2a714f95dcd58337fb2856" uuid = "82899510-4779-5014-852e-03e436cf321d" version = "1.0.0" [[JLLWrappers]] git-tree-sha1 = "a431f5f2ca3f4feef3bd7a5e94b8b8d4f2f647a0" uuid = "692b3bcd-3c85-4b1f-b108-f13ce0eb3210" version = "1.2.0" [[JSON]] deps = ["Dates", "Mmap", "Parsers", "Unicode"] git-tree-sha1 = "81690084b6198a2e1da36fcfda16eeca9f9f24e4" uuid = "682c06a0-de6a-54ab-a142-c8b1cf79cde6" version = "0.21.1" [[JpegTurbo_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "9aff0587d9603ea0de2c6f6300d9f9492bbefbd3" uuid = "aacddb02-875f-59d6-b918-886e6ef4fbf8" version = "2.0.1+3" [[Juno]] deps = ["Base64", "Logging", "Media", "Profile"] git-tree-sha1 = "07cb43290a840908a771552911a6274bc6c072c7" uuid = "e5e0dc1b-0480-54bc-9374-aad01c23163d" version = "0.8.4" [[LLVM]] deps = ["CEnum", "Libdl", "Printf", "Unicode"] git-tree-sha1 = "b616937c31337576360cb9fb872ec7633af7b194" uuid = "929cbde3-209d-540e-8aea-75f648917ca0" version = "3.6.0" [[LibGit2]] deps = ["Printf"] uuid = "76f85450-5226-5b5a-8eaa-529ad045b433" [[Libdl]] uuid = "8f399da3-3557-5675-b5ff-fb832c97cbdb" [[Libtiff_jll]] deps = ["Artifacts", "JLLWrappers", "JpegTurbo_jll", "Libdl", "Pkg", "Zlib_jll", "Zstd_jll"] git-tree-sha1 = "291dd857901f94d683973cdf679984cdf73b56d0" uuid = "89763e89-9b03-5906-acba-b20f662cd828" version = "4.1.0+2" [[LinearAlgebra]] deps = ["Libdl"] uuid = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e" [[Logging]] uuid = "56ddb016-857b-54e1-b83d-db4d58db5568" [[MKL_jll]] deps = ["IntelOpenMP_jll", "Libdl", "Pkg"] 
git-tree-sha1 = "eb540ede3aabb8284cb482aa41d00d6ca850b1f8" uuid = "856f044c-d86e-5d09-b602-aeab76dc8ba7" version = "2020.2.254+0" [[MacroTools]] deps = ["Markdown", "Random"] git-tree-sha1 = "6a8a2a625ab0dea913aba95c11370589e0239ff0" uuid = "1914dd2f-81c6-5fcd-8719-6d5c9610ff09" version = "0.5.6" [[MappedArrays]] deps = ["FixedPointNumbers"] git-tree-sha1 = "b92bd220c95a8bbe89af28f11201fd080e0e3fe7" uuid = "dbb5928d-eab1-5f90-85c2-b9b0edb7c900" version = "0.3.0" [[Markdown]] deps = ["Base64"] uuid = "d6f4376e-aef5-505a-96c1-9c027394607a" [[MbedTLS]] deps = ["Dates", "MbedTLS_jll", "Random", "Sockets"] git-tree-sha1 = "1c38e51c3d08ef2278062ebceade0e46cefc96fe" uuid = "739be429-bea8-5141-9913-cc70e7f3736d" version = "1.0.3" [[MbedTLS_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "0eef589dd1c26a3ac9d753fe1a8bcad63f956fa6" uuid = "c8ffd9c3-330d-5841-b78e-0817d7145fa1" version = "2.16.8+1" [[Media]] deps = ["MacroTools", "Test"] git-tree-sha1 = "75a54abd10709c01f1b86b84ec225d26e840ed58" uuid = "e89f7d12-3494-54d1-8411-f7d8b9ae1f27" version = "0.5.0" [[Metalhead]] deps = ["BSON", "ColorTypes", "Flux", "ImageFiltering", "Images", "REPL", "Requires", "Statistics"] git-tree-sha1 = "f977250f801e0f61ba11425bbb1d83778eae5c4b" uuid = "dbeba491-748d-5e0e-a39e-b530a07fa0cc" version = "0.5.2" [[Missings]] deps = ["DataAPI"] git-tree-sha1 = "f8c673ccc215eb50fcadb285f522420e29e69e1c" uuid = "e1d29d7a-bbdc-5cf2-9ac0-f12de2c33e28" version = "0.4.5" [[Mmap]] uuid = "a63ad114-7e13-5084-954f-fe012c677804" [[MosaicViews]] deps = ["MappedArrays", "OffsetArrays", "PaddedViews"] git-tree-sha1 = "614e8d77264d20c1db83661daadfab38e8e4b77e" uuid = "e94cdb99-869f-56ef-bcf0-1ae2bcbe0389" version = "0.2.4" [[MsgPack]] deps = ["Serialization"] git-tree-sha1 = "a8cbf066b54d793b9a48c5daa5d586cf2b5bd43d" uuid = "99f44e22-a591-53d1-9472-aa23ef4bd671" version = "1.1.0" [[NNlib]] deps = ["ChainRulesCore", "Compat", "LinearAlgebra", "Pkg", "Requires", "Statistics"] git-tree-sha1 
= "df42d0816edfc24f5b82a728f46381613c4dff79" uuid = "872c559c-99b0-510c-b3b7-b6c96a88d5cd" version = "0.7.14" [[NaNMath]] git-tree-sha1 = "bfe47e760d60b82b66b61d2d44128b62e3a369fb" uuid = "77ba4419-2d1f-58cd-9bb1-8ffee604a2e3" version = "0.3.5" [[Netpbm]] deps = ["ColorVectorSpace", "FileIO", "ImageCore"] git-tree-sha1 = "03472ec5ea8884b791c6340712f3261c0f393691" uuid = "f09324ee-3d7c-5217-9330-fc30815ba969" version = "1.0.0" [[OffsetArrays]] deps = ["Adapt"] git-tree-sha1 = "76622f08645764e040b4d7e86d0ff471fd126ae4" uuid = "6fe1bfb0-de20-5000-8ca7-80f57d26f881" version = "1.5.3" [[OpenSpecFun_jll]] deps = ["Artifacts", "CompilerSupportLibraries_jll", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "9db77584158d0ab52307f8c04f8e7c08ca76b5b3" uuid = "efe28fd5-8261-553b-a9e1-b2916fc3738e" version = "0.5.3+4" [[OrderedCollections]] git-tree-sha1 = "d45739abcfc03b51f6a42712894a593f74c80a23" uuid = "bac558e1-5e72-5ebc-8fee-abe8a469f55d" version = "1.3.3" [[PNGFiles]] deps = ["Base64", "CEnum", "ImageCore", "IndirectArrays", "OffsetArrays", "libpng_jll"] git-tree-sha1 = "aa6e87a2361c2fe5a63b1a6a4b567f13aa108991" uuid = "f57f5aa1-a3ce-4bc8-8ab9-96f992907883" version = "0.3.5" [[PaddedViews]] deps = ["OffsetArrays"] git-tree-sha1 = "0fa5e78929aebc3f6b56e1a88cf505bb00a354c4" uuid = "5432bcbf-9aad-5242-b902-cca2824c8663" version = "0.5.8" [[Parameters]] deps = ["OrderedCollections", "UnPack"] git-tree-sha1 = "2276ac65f1e236e0a6ea70baff3f62ad4c625345" uuid = "d96e819e-fc66-5662-9728-84c9c7592b0a" version = "0.12.2" [[Parsers]] deps = ["Dates"] git-tree-sha1 = "50c9a9ed8c714945e01cd53a21007ed3865ed714" uuid = "69de0a69-1ddd-5017-9359-2bf0b02dc9f0" version = "1.0.15" [[Pkg]] deps = ["Dates", "LibGit2", "Libdl", "Logging", "Markdown", "Printf", "REPL", "Random", "SHA", "UUIDs"] uuid = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f" [[Pluto]] deps = ["Base64", "Dates", "Distributed", "FuzzyCompletions", "HTTP", "InteractiveUtils", "Logging", "Markdown", "MsgPack", "Pkg", "REPL", "Sockets", 
"Tables", "UUIDs"] git-tree-sha1 = "fe1fdbff28f179216a1e756bd5494057b036945f" uuid = "c3e4b0f8-55cb-11ea-2926-15256bba5781" version = "0.12.20" [[PooledArrays]] deps = ["DataAPI"] git-tree-sha1 = "0e8f5c428a41a81cd71f76d76f2fc3415fe5a676" uuid = "2dfb63ee-cc39-5dd5-95bd-886bf059d720" version = "1.1.0" [[PrettyTables]] deps = ["Crayons", "Formatting", "Markdown", "Reexport", "Tables"] git-tree-sha1 = "574a6b3ea95f04e8757c0280bb9c29f1a5e35138" uuid = "08abe8d2-0d0c-5749-adfa-8a2ac140af0d" version = "0.11.1" [[Printf]] deps = ["Unicode"] uuid = "de0858da-6303-5e67-8744-51eddeeeb8d7" [[Profile]] deps = ["Printf"] uuid = "9abbd945-dff8-562f-b5e8-e1ebf5ef1b79" [[REPL]] deps = ["InteractiveUtils", "Markdown", "Sockets"] uuid = "3fa0cd96-eef1-5676-8a61-b3b8758bbffb" [[Random]] deps = ["Serialization"] uuid = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c" [[RangeArrays]] git-tree-sha1 = "b9039e93773ddcfc828f12aadf7115b4b4d225f5" uuid = "b3c3ace0-ae52-54e7-9d0b-2c1406fd6b9d" version = "0.3.2" [[Ratios]] git-tree-sha1 = "37d210f612d70f3f7d57d488cb3b6eff56ad4e41" uuid = "c84ed2f1-dad5-54f0-aa8e-dbefe2724439" version = "0.4.0" [[Reexport]] git-tree-sha1 = "57d8440b0c7d98fc4f889e478e80f268d534c9d5" uuid = "189a3867-3050-52da-a836-e630ba90ab69" version = "1.0.0" [[Requires]] deps = ["UUIDs"] git-tree-sha1 = "cfbac6c1ed70c002ec6361e7fd334f02820d6419" uuid = "ae029012-a4dd-5104-9daa-d747884805df" version = "1.1.2" [[Rotations]] deps = ["LinearAlgebra", "StaticArrays", "Statistics"] git-tree-sha1 = "2ed8d8a16d703f900168822d83699b8c3c1a5cd8" uuid = "6038ab10-8711-5258-84ad-4b1120ba62dc" version = "1.0.2" [[SHA]] uuid = "ea8e919c-243c-51af-8825-aaa63cd721ce" [[Scratch]] deps = ["Dates"] git-tree-sha1 = "ad4b278adb62d185bbcb6864dc24959ab0627bf6" uuid = "6c6a2e73-6563-6170-7368-637461726353" version = "1.0.3" [[SentinelArrays]] deps = ["Dates", "Random"] git-tree-sha1 = "6ccde405cf0759eba835eb613130723cb8f10ff9" uuid = "91c51154-3ec4-41a3-a24f-3f23e20d615c" version = "1.2.16" [[Serialization]] 
uuid = "9e88b42a-f829-5b0c-bbe9-9e923198166b" [[SharedArrays]] deps = ["Distributed", "Mmap", "Random", "Serialization"] uuid = "1a1011a3-84de-559e-8e89-a11a2f7dc383" [[SimpleTraits]] deps = ["InteractiveUtils", "MacroTools"] git-tree-sha1 = "daf7aec3fe3acb2131388f93a4c409b8c7f62226" uuid = "699a6c99-e7fa-54fc-8d76-47d257e15c1d" version = "0.9.3" [[Sockets]] uuid = "6462fe0b-24de-5631-8697-dd941f90decc" [[SortingAlgorithms]] deps = ["DataStructures", "Random", "Test"] git-tree-sha1 = "03f5898c9959f8115e30bc7226ada7d0df554ddd" uuid = "a2af1166-a08f-5f64-846c-94a0d3cef48c" version = "0.3.1" [[SparseArrays]] deps = ["LinearAlgebra", "Random"] uuid = "2f01184e-e22b-5df5-ae63-d93ebab69eaf" [[SpecialFunctions]] deps = ["ChainRulesCore", "OpenSpecFun_jll"] git-tree-sha1 = "75394dbe2bd346beeed750fb02baa6445487b862" uuid = "276daf66-3868-5448-9aa4-cd146d93841b" version = "1.2.1" [[StaticArrays]] deps = ["LinearAlgebra", "Random", "Statistics"] git-tree-sha1 = "9da72ed50e94dbff92036da395275ed114e04d49" uuid = "90137ffa-7385-5640-81b9-e52037218182" version = "1.0.1" [[Statistics]] deps = ["LinearAlgebra", "SparseArrays"] uuid = "10745b16-79ce-11e8-11f9-7d13ad32a3b2" [[StatsBase]] deps = ["DataAPI", "DataStructures", "LinearAlgebra", "Missings", "Printf", "Random", "SortingAlgorithms", "SparseArrays", "Statistics"] git-tree-sha1 = "7bab7d4eb46b225b35179632852b595a3162cb61" uuid = "2913bbd2-ae8a-5f71-8c99-4fb6c76f3a91" version = "0.33.2" [[StructTypes]] deps = ["Dates", "UUIDs"] git-tree-sha1 = "65a43f5218197bc7091b76bc273a5e323a1d7b0d" uuid = "856f2bd8-1eba-4b0a-8007-ebc267875bd4" version = "1.2.3" [[TableTraits]] deps = ["IteratorInterfaceExtensions"] git-tree-sha1 = "b1ad568ba658d8cbb3b892ed5380a6f3e781a81e" uuid = "3783bdb8-4a98-5b6b-af9a-565f29a5fe9c" version = "1.0.0" [[Tables]] deps = ["DataAPI", "DataValueInterfaces", "IteratorInterfaceExtensions", "LinearAlgebra", "TableTraits", "Test"] git-tree-sha1 = "a716dde43d57fa537a19058d044b495301ba6565" uuid = 
"bd369af6-aec1-5ad0-b16a-f7cc5008161c" version = "1.3.2" [[Test]] deps = ["Distributed", "InteractiveUtils", "Logging", "Random"] uuid = "8dfed614-e22c-5e08-85e1-65c5234f0b40" [[TiledIteration]] deps = ["OffsetArrays"] git-tree-sha1 = "05f74c5b3c00d5336bc109416df2df907e3bd91d" uuid = "06e1c1a7-607b-532d-9fad-de7d9aa2abac" version = "0.2.5" [[TimerOutputs]] deps = ["Printf"] git-tree-sha1 = "3318281dd4121ecf9713ce1383b9ace7d7476fdd" uuid = "a759f4b9-e2f1-59dc-863e-4aeb61b1ea8f" version = "0.5.7" [[TranscodingStreams]] deps = ["Random", "Test"] git-tree-sha1 = "7c53c35547de1c5b9d46a4797cf6d8253807108c" uuid = "3bb67fe8-82b1-5028-8e26-92a6c54297fa" version = "0.9.5" [[URIs]] git-tree-sha1 = "7855809b88d7b16e9b029afd17880930626f54a2" uuid = "5c2747f8-b7ea-4ff2-ba2e-563bfd36b1d4" version = "1.2.0" [[UUIDs]] deps = ["Random", "SHA"] uuid = "cf7118a7-6976-5b1a-9a39-7adc72f591a4" [[UnPack]] git-tree-sha1 = "387c1f73762231e86e0c9c5443ce3b4a0a9a0c2b" uuid = "3a884ed6-31ef-47d7-9d2a-63182c4928ed" version = "1.0.2" [[Unicode]] uuid = "4ec0a83e-493e-50e2-b9ac-8f72acf5a8f5" [[WoodburyMatrices]] deps = ["LinearAlgebra", "SparseArrays"] git-tree-sha1 = "59e2ad8fd1591ea019a5259bd012d7aee15f995c" uuid = "efce3f68-66dc-5838-9240-27a6d6f5f9b6" version = "0.5.3" [[ZipFile]] deps = ["Libdl", "Printf", "Zlib_jll"] git-tree-sha1 = "c3a5637e27e914a7a445b8d0ad063d701931e9f7" uuid = "a5390f91-8eb1-5f08-bee0-b1d1ffed6cea" version = "0.9.3" [[Zlib_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "320228915c8debb12cb434c59057290f0834dbf6" uuid = "83775a58-1f1d-513f-b197-d71354ab007a" version = "1.2.11+18" [[Zstd_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg"] git-tree-sha1 = "2c1332c54931e83f8f94d310fa447fd743e8d600" uuid = "3161d3a3-bdf6-5164-811a-617609db77b4" version = "1.4.8+0" [[Zygote]] deps = ["AbstractFFTs", "ChainRules", "DiffRules", "Distributed", "FillArrays", "ForwardDiff", "IRTools", "InteractiveUtils", "LinearAlgebra", "MacroTools", "NaNMath", 
"Random", "Requires", "SpecialFunctions", "Statistics", "ZygoteRules"] git-tree-sha1 = "52835a83f7c899cfcb95f796d584201812887ea8" uuid = "e88e6eb3-aa80-5325-afca-941959d7151f" version = "0.6.3" [[ZygoteRules]] deps = ["MacroTools"] git-tree-sha1 = "9e7a1e8ca60b742e508a315c17eef5211e7fbfd7" uuid = "700de1a5-db45-46bc-99cf-38207098b444" version = "0.2.1" [[libpng_jll]] deps = ["Artifacts", "JLLWrappers", "Libdl", "Pkg", "Zlib_jll"] git-tree-sha1 = "6abbc424248097d69c0c87ba50fcb0753f93e0ee" uuid = "b53b4c65-9356-5827-b1ea-8c7a1a84506f" version = "1.6.37+6" ```

Version info

Details on Julia (compiled Julia from sources, Ubuntu 20.04):

Julia Version 1.5.3
Commit 788b2c77c1 (2020-11-09 13:37 UTC)
Platform Info:
  OS: Linux (x86_64-linux-gnu)
  CPU: AMD Ryzen 9 5950X 16-Core Processor
  WORD_SIZE: 64
  LIBM: libopenlibm
  LLVM: libLLVM-9.0.1 (ORCJIT, generic)
Environment:
  JULIA_DEBUG = CUBLAS

Details on CUDA:

CUDA toolkit 11.1.1, artifact installation
CUDA driver 11.2.0
NVIDIA driver 460.32.3

Libraries: 
- CUBLAS: 11.4.1
- CURAND: 10.2.2
- CUFFT: 10.3.0
- CUSOLVER: 11.0.1
- CUSPARSE: 11.3.0
- CUPTI: 14.0.0
- NVML: 11.0.0+460.32.3
- CUDNN: 8.0.4 (for CUDA 11.1.0)
- CUTENSOR: 1.2.1 (for CUDA 11.1.0)

Toolchain:
- Julia: 1.5.3
- LLVM: 9.0.1
- PTX ISA support: 3.2, 4.0, 4.1, 4.2, 4.3, 5.0, 6.0, 6.1, 6.3, 6.4
- Device support: sm_35, sm_37, sm_50, sm_52, sm_53, sm_60, sm_61, sm_62, sm_70, sm_72, sm_75

1 device:
  0: GeForce RTX 3090 (sm_86, 22.438 GiB / 23.691 GiB available)
maleadt commented 3 years ago

I found this forum-post, maybe it is related?

No, that post details CUBLAS_STATUS_NOT_SUPPORTED for Int8 multiplication. You are getting CUBLAS_STATUS_ARCH_MISMATCH for a Float16=Float16*Float16 GEMM. This looks like a CUBLAS bug... You could try upgrading to CUDA 11.2 by using the CUDA.jl master branch.

Talinx commented 3 years ago

You could try upgrading to CUDA 11.2 by using the CUDA.jl master branch.

Thank you, that works! (Julia 1.6.0-rc1, CUDA.jl from master, CUDA 11.2.0) ] test CUDA also works now (except 3 from device/intrinsics, same as in https://github.com/JuliaGPU/CUDA.jl/issues/711).

maleadt commented 3 years ago

It looks like several people are running into this, but I don't have a clear debug log yet that points to the failing invocation of gemmEx. So for those with this issue, please run with JULIA_DEBUG=CUBLAS (requires master branch, or compat for 1.5), and please try to reduce to an MWE (i.e. not just running the entire test suite). Comparing CUDA 11.1 to 11.2 (which you can force by starting Julia with JULIA_CUDA_VERSION set to respectively 11.1 or 11.2) would be helpful here too.

cchan commented 3 years ago

Coming here from #722 and feeling silly now because JULIA_CUDA_VERSION=11.2 actually made it work correctly. Not sure why it didn't try to use those artifacts automatically, since everything in my environment has version 11.2 (er, or 11.3). Also, it still doesn't work with the local toolkit. If it helps, here's my info:

repro:

using CUDA
a = CUDA.rand(2,2)
b = CUDA.rand(2,2)
a * b

Notably, a+b works fine.

Environment info:

$ nvcc --version
nvcc: NVIDIA (R) Cuda compiler driver
Copyright (c) 2005-2021 NVIDIA Corporation
Built on Thu_Jan_28_19:32:09_PST_2021
Cuda compilation tools, release 11.2, V11.2.142
Build cuda_11.2.r11.2/compiler.29558016_0
$ nvdisasm --version
nvdisasm: NVIDIA (R) CUDA disassembler
Copyright (c) 2005-2021 NVIDIA Corporation
Built on Tue_Jan_19_19:22:01_PST_2021
Cuda compilation tools, release 11.2, V11.2.135
Build cuda_11.2.r11.2/compiler.29518894_0
+-----------------------------------------------------------------------------+
| NVIDIA-SMI 465.51       Driver Version: 465.51       CUDA Version: 11.3     |
|-------------------------------+----------------------+----------------------+
| GPU  Name            TCC/WDDM | Bus-Id        Disp.A | Volatile Uncorr. ECC |
| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |
|                               |                      |               MIG M. |
|===============================+======================+======================|
|   0  NVIDIA GeForce ... WDDM  | 00000000:09:00.0  On |                  N/A |
|  0%   53C    P8     9W / 175W |   2975MiB /  8192MiB |      1%      Default |
|                               |                      |                  N/A |
+-------------------------------+----------------------+----------------------+
julia> CUDA.version()
v"11.3.0"

Using 11.2:

$ JULIA_CUDA_VERSION=11.2 JULIA_DEBUG=CUBLAS julia src/test.jl
  Downloaded artifact: CUDA112
I! cuBLAS (v11.2) function cublasStatus_t cublasCreate_v2(cublasContext**) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0x7ffd10a64930)
i! Time: 2021-02-19T07:13:36 elapsed from start 0.033333 minutes or 2.000000 seconds
i!Process=14055; Thread=140220191823680; GPU=0; Handle=POINTER (IN HEX:0x(nil))
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)
I! cuBLAS (v11.2) function cublasStatus_t cublasSetStream_v2(cublasHandle_t, cudaStream_t) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0xa8af7b0)
i!  streamId: type=SOME TYPE; val=POINTER (IN HEX:0x0x2)
i! Time: 2021-02-19T07:13:36 elapsed from start 0.033333 minutes or 2.000000 seconds
i!Process=14055; Thread=140220191823680; GPU=0; Handle=POINTER (IN HEX:0x0xa8af7b0); StreamId=POINTER (IN HEX:0x(nil)) (defaultStream); MathMode=CUBLAS_DEFAULT_MATH
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)
I! cuBLAS (v11.2) function cublasStatus_t cublasSetWorkspace_v2(cublasHandle_t, void*, size_t) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0xa8af7b0)
i!  workspace: type=void; val=POINTER (IN HEX:0x0x70fd60000)
i!  workspaceSizeInBytes: type=SOME TYPE; val=4194304
i! Time: 2021-02-19T07:13:36 elapsed from start 0.033333 minutes or 2.000000 seconds
i!Process=14055; Thread=140220191823680; GPU=0; Handle=POINTER (IN HEX:0x0xa8af7b0); StreamId=POINTER (IN HEX:0x0x2); MathMode=CUBLAS_DEFAULT_MATH
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)
I! cuBLAS (v11.2) function cublasStatus_t cublasSetMathMode(cublasHandle_t, cublasMath_t) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0xa8af7b0)
i!  mode: type=cublasMath_t; val=CUBLAS_DEFAULT_MATH | CUBLAS_MATH_DISALLOW_REDUCED_PRECISION_REDUCTION(16)
i! Time: 2021-02-19T07:13:36 elapsed from start 0.033333 minutes or 2.000000 seconds
i!Process=14055; Thread=140220191823680; GPU=0; Handle=POINTER (IN HEX:0x0xa8af7b0); StreamId=POINTER (IN HEX:0x0x2); MathMode=CUBLAS_DEFAULT_MATH
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)
I! cuBLAS (v11.2) function cublasStatus_t cublasGemmEx(cublasHandle_t, cublasOperation_t, cublasOperation_t, int, int, int, const void*, const void*, cudaDataType_t, int, const void*, cudaDataType_t, int, const void*, void*, cudaDataType_t, int, cublasComputeType_t, cublasGemmAlgo_t) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0xa8af7b0)
i!  transa: type=cublasOperation_t; val=CUBLAS_OP_N(0)
i!  transb: type=cublasOperation_t; val=CUBLAS_OP_N(0)
i!  m: type=int; val=2
i!  n: type=int; val=2
i!  k: type=int; val=2
i!  alpha: type=void; val=POINTER (IN HEX:0x0x7f871ad2c290)
i!  A: type=void; val=POINTER (IN HEX:0x0x705790000)
i!  Atype: type=cudaDataType_t; val=CUDA_R_32F(0)
i!  lda: type=int; val=2
i!  B: type=void; val=POINTER (IN HEX:0x0x705790200)
i!  Btype: type=cudaDataType_t; val=CUDA_R_32F(0)
i!  ldb: type=int; val=2
i!  beta: type=void; val=POINTER (IN HEX:0x0x7f871ad2c2a0)
i!  C: type=void; val=POINTER (IN HEX:0x0x705790400)
i!  Ctype: type=cudaDataType_t; val=CUDA_R_32F(0)
i!  ldc: type=int; val=2
i!  computeType: type=cublasComputeType_t; val=CUBLAS_COMPUTE_32F(68)
i!  algo: type=SOME TYPE; val=CUBLAS_GEMM_DEFAULT(-1)
i! Time: 2021-02-19T07:13:36 elapsed from start 0.033333 minutes or 2.000000 seconds
i!Process=14055; Thread=140220191823680; GPU=0; Handle=POINTER (IN HEX:0x0xa8af7b0); StreamId=POINTER (IN HEX:0x0x2); MathMode=CUBLAS_DEFAULT_MATH | CUBLAS_MATH_DISALLOW_REDUCED_PRECISION_REDUCTION
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)
I! cuBLAS (v11.2) function cublasStatus_t cublasDestroy_v2(cublasHandle_t) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0xa8af7b0)
i! Time: 2021-02-19T07:13:37 elapsed from start 0.050000 minutes or 3.000000 seconds
i!Process=14055; Thread=140220191823680; GPU=0; Handle=POINTER (IN HEX:0x0xa8af7b0); StreamId=POINTER (IN HEX:0x0x2); MathMode=CUBLAS_DEFAULT_MATH | CUBLAS_MATH_DISALLOW_REDUCED_PRECISION_REDUCTION
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)

Using 11.1:

$ JULIA_CUDA_VERSION=11.1 JULIA_DEBUG=CUBLAS julia src/test.jl
I! cuBLAS (v11.1) function cublasStatus_t cublasCreate_v2(cublasContext**) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0x7fff4e976470)
i! Time: 2021-02-19T07:11:27 elapsed from start 0.016667 minutes or 1.000000 seconds
i!Process=14012; Thread=139705143056192; GPU=0; Handle=POINTER (IN HEX:0x(nil))
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)
I! cuBLAS (v11.1) function cublasStatus_t cublasSetStream_v2(cublasHandle_t, cudaStream_t) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0xbd23810)
i!  streamId: type=SOME TYPE; val=POINTER (IN HEX:0x0x2)
i! Time: 2021-02-19T07:11:28 elapsed from start 0.033333 minutes or 2.000000 seconds
i!Process=14012; Thread=139705143056192; GPU=0; Handle=POINTER (IN HEX:0x0xbd23810); StreamId=POINTER (IN HEX:0x(nil)) (defaultStream); MathMode=CUBLAS_DEFAULT_MATH
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)
I! cuBLAS (v11.1) function cublasStatus_t cublasSetWorkspace_v2(cublasHandle_t, void*, size_t) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0xbd23810)
i!  workspace: type=void; val=POINTER (IN HEX:0x0x70fd60000)
i!  workspaceSizeInBytes: type=SOME TYPE; val=4194304
i! Time: 2021-02-19T07:11:28 elapsed from start 0.033333 minutes or 2.000000 seconds
i!Process=14012; Thread=139705143056192; GPU=0; Handle=POINTER (IN HEX:0x0xbd23810); StreamId=POINTER (IN HEX:0x0x2); MathMode=CUBLAS_DEFAULT_MATH
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)
I! cuBLAS (v11.1) function cublasStatus_t cublasSetMathMode(cublasHandle_t, cublasMath_t) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0xbd23810)
i!  mode: type=cublasMath_t; val=CUBLAS_DEFAULT_MATH | CUBLAS_MATH_DISALLOW_REDUCED_PRECISION_REDUCTION(16)
i! Time: 2021-02-19T07:11:28 elapsed from start 0.033333 minutes or 2.000000 seconds
i!Process=14012; Thread=139705143056192; GPU=0; Handle=POINTER (IN HEX:0x0xbd23810); StreamId=POINTER (IN HEX:0x0x2); MathMode=CUBLAS_DEFAULT_MATH
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)
I! cuBLAS (v11.1) function cublasStatus_t cublasGemmEx(cublasHandle_t, cublasOperation_t, cublasOperation_t, int, int, int, const void*, const void*, cudaDataType_t, int, const void*, cudaDataType_t, int, const void*, void*, cudaDataType_t, int, cublasComputeType_t, cublasGemmAlgo_t) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0xbd23810)
i!  transa: type=cublasOperation_t; val=CUBLAS_OP_N(0)
i!  transb: type=cublasOperation_t; val=CUBLAS_OP_N(0)
i!  m: type=int; val=2
i!  n: type=int; val=2
i!  k: type=int; val=2
i!  alpha: type=void; val=POINTER (IN HEX:0x0x7f0f2968b720)
i!  A: type=void; val=POINTER (IN HEX:0x0x705790000)
i!  Atype: type=cudaDataType_t; val=CUDA_R_32F(0)
i!  lda: type=int; val=2
i!  B: type=void; val=POINTER (IN HEX:0x0x705790200)
i!  Btype: type=cudaDataType_t; val=CUDA_R_32F(0)
i!  ldb: type=int; val=2
i!  beta: type=void; val=POINTER (IN HEX:0x0x7f0f2968b730)
i!  C: type=void; val=POINTER (IN HEX:0x0x705790400)
i!  Ctype: type=cudaDataType_t; val=CUDA_R_32F(0)
i!  ldc: type=int; val=2
i!  computeType: type=cublasComputeType_t; val=CUBLAS_COMPUTE_32F(68)
i!  algo: type=SOME TYPE; val=CUBLAS_GEMM_DEFAULT(-1)
i! Time: 2021-02-19T07:11:28 elapsed from start 0.033333 minutes or 2.000000 seconds
i!Process=14012; Thread=139705143056192; GPU=0; Handle=POINTER (IN HEX:0x0xbd23810); StreamId=POINTER (IN HEX:0x0x2); MathMode=CUBLAS_DEFAULT_MATH | CUBLAS_MATH_DISALLOW_REDUCED_PRECISION_REDUCTION
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)
ERROR: LoadError: CUBLASError: an absent device architectural feature is required (code 8, CUBLAS_STATUS_ARCH_MISMATCH)
Stacktrace:
  [1] throw_api_error(res::CUDA.CUBLAS.cublasStatus_t)
    @ CUDA.CUBLAS ~/.julia/packages/CUDA/Zmd60/lib/cublas/error.jl:47
  [2] macro expansion
    @ ~/.julia/packages/CUDA/Zmd60/lib/cublas/error.jl:58 [inlined]
  [3] cublasGemmEx(handle::Ptr{Nothing}, transa::Char, transb::Char, m::Int64, n::Int64, k::Int64, alpha::Base.RefValue{Float32}, A::CuArray{Float32, 2}, Atype::Type, lda::Int64, B::CuArray{Float32, 2}, Btype::Type, ldb::Int64, beta::Base.RefValue{Float32}, C::CuArray{Float32, 2}, Ctype::Type, ldc::Int64, computeType::CUDA.CUBLAS.cublasComputeType_t, algo::CUDA.CUBLAS.cublasGemmAlgo_t)
    @ CUDA.CUBLAS ~/.julia/packages/CUDA/Zmd60/lib/utils/call.jl:26
  [4] gemmEx!(transA::Char, transB::Char, alpha::Number, A::Union{CuVecOrMat{T}, DenseCuVecOrMat{T}} where T, B::Union{CuVecOrMat{T}, DenseCuVecOrMat{T}} where T, beta::Number, C::Union{CuVecOrMat{T}, DenseCuVecOrMat{T}} where T; algo::CUDA.CUBLAS.cublasGemmAlgo_t)
    @ CUDA.CUBLAS ~/.julia/packages/CUDA/Zmd60/lib/cublas/wrappers.jl:837
  [5] gemmEx!
    @ ~/.julia/packages/CUDA/Zmd60/lib/cublas/wrappers.jl:819 [inlined]
  [6] gemm_dispatch!(C::CuArray{Float32, 2}, A::CuArray{Float32, 2}, B::CuArray{Float32, 2}, alpha::Bool, beta::Bool)
    @ CUDA.CUBLAS ~/.julia/packages/CUDA/Zmd60/lib/cublas/linalg.jl:222
  [7] mul!
    @ ~/.julia/packages/CUDA/Zmd60/lib/cublas/linalg.jl:233 [inlined]
  [8] mul!
    @ /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.6/LinearAlgebra/src/matmul.jl:275 [inlined]
  [9] *(A::CuArray{Float32, 2}, B::CuArray{Float32, 2})
    @ LinearAlgebra /buildworker/worker/package_linux64/build/usr/share/julia/stdlib/v1.6/LinearAlgebra/src/matmul.jl:160
 [10] top-level scope
    @ [...]/src/test.jl:4
in expression starting at [...]/src/test.jl:4
I! cuBLAS (v11.1) function cublasStatus_t cublasDestroy_v2(cublasHandle_t) called:
i!  handle: type=cublasHandle_t; val=POINTER (IN HEX:0x0xbd23810)
i! Time: 2021-02-19T07:11:29 elapsed from start 0.050000 minutes or 3.000000 seconds
i!Process=14012; Thread=139705143056192; GPU=0; Handle=POINTER (IN HEX:0x0xbd23810); StreamId=POINTER (IN HEX:0x0x2); MathMode=CUBLAS_DEFAULT_MATH | CUBLAS_MATH_DISALLOW_REDUCED_PRECISION_REDUCTION
i! COMPILED WITH: GNU GCC/G++ / 5.3.1 20160406 (Red Hat 5.3.1-6)

Using local 11.2 toolkit:

$ JULIA_CUDA_USE_BINARYBUILDER=false JULIA_DEBUG=CUBLAS julia src/test.jl
┌ Error: Error during initialization of CUDA.jl
│   exception =
│    CUDA.jl does not yet support CUDA with nvdisasm 11.2.135; please file an issue.
│    Stacktrace:
│      [1] error(s::String)
│        @ Base ./error.jl:33
│      [2] parse_toolkit_version(tool::String, tool_path::String)
│        @ CUDA ~/.julia/packages/CUDA/Zmd60/deps/discovery.jl:411
│      [3] use_local_cuda()
│        @ CUDA ~/.julia/packages/CUDA/Zmd60/deps/bindeps.jl:218
│      [4] __init_dependencies__()
│        @ CUDA ~/.julia/packages/CUDA/Zmd60/deps/bindeps.jl:384
│      [5] __runtime_init__()
│        @ CUDA ~/.julia/packages/CUDA/Zmd60/src/initialization.jl:103
│      [6] macro expansion
│        @ ~/.julia/packages/CUDA/Zmd60/src/initialization.jl:32 [inlined]
│      [7] macro expansion
│        @ ./lock.jl:209 [inlined]
│      [8] _functional(show_reason::Bool)
│        @ CUDA ~/.julia/packages/CUDA/Zmd60/src/initialization.jl:26
│      [9] functional(show_reason::Bool)
│        @ CUDA ~/.julia/packages/CUDA/Zmd60/src/initialization.jl:19
│     [10] libcuda()
│        @ CUDA ~/.julia/packages/CUDA/Zmd60/src/initialization.jl:47
│     [11] macro expansion
│        @ ~/.julia/packages/CUDA/Zmd60/lib/cudadrv/libcuda.jl:29 [inlined]
│     [12] macro expansion
│        @ ~/.julia/packages/CUDA/Zmd60/lib/cudadrv/error.jl:102 [inlined]
│     [13] cuDeviceGet
│        @ ~/.julia/packages/CUDA/Zmd60/lib/utils/call.jl:26 [inlined]
│     [14] CuDevice
│        @ ~/.julia/packages/CUDA/Zmd60/lib/cudadrv/devices.jl:25 [inlined]
│     [15] initialize_thread(tid::Int64)
│        @ CUDA ~/.julia/packages/CUDA/Zmd60/src/state.jl:121
│     [16] prepare_cuda_call
│        @ ~/.julia/packages/CUDA/Zmd60/src/state.jl:80 [inlined]
│     [17] context
│        @ ~/.julia/packages/CUDA/Zmd60/src/state.jl:142 [inlined]
│     [18] default_rng()
│        @ CUDA.CURAND ~/.julia/packages/CUDA/Zmd60/lib/curand/CURAND.jl:32
│     [19] rand(dim1::Int64, dims::Int64)
│        @ CUDA ~/.julia/packages/CUDA/Zmd60/src/random.jl:70
│     [20] top-level scope
│        @ [...]/src/test.jl:2
│     [21] include(mod::Module, _path::String)
│        @ Base ./Base.jl:386
│     [22] exec_options(opts::Base.JLOptions)
│        @ Base ./client.jl:285
│     [23] _start()
│        @ Base ./client.jl:485
└ @ CUDA ~/.julia/packages/CUDA/Zmd60/src/initialization.jl:34
ERROR: LoadError: CUDA.jl did not successfully initialize, and is not usable.
If you did not see any other error message, try again in a new session
with the JULIA_DEBUG environment variable set to 'CUDA'.
Stacktrace:
  [1] error(s::String)
    @ Base ./error.jl:33
  [2] libcuda()
    @ CUDA ~/.julia/packages/CUDA/Zmd60/src/initialization.jl:48
  [3] macro expansion
    @ ~/.julia/packages/CUDA/Zmd60/lib/cudadrv/libcuda.jl:29 [inlined]
  [4] macro expansion
    @ ~/.julia/packages/CUDA/Zmd60/lib/cudadrv/error.jl:102 [inlined]
  [5] cuDeviceGet
    @ ~/.julia/packages/CUDA/Zmd60/lib/utils/call.jl:26 [inlined]
  [6] CuDevice
    @ ~/.julia/packages/CUDA/Zmd60/lib/cudadrv/devices.jl:25 [inlined]
  [7] initialize_thread(tid::Int64)
    @ CUDA ~/.julia/packages/CUDA/Zmd60/src/state.jl:121
  [8] prepare_cuda_call
    @ ~/.julia/packages/CUDA/Zmd60/src/state.jl:80 [inlined]
  [9] context
    @ ~/.julia/packages/CUDA/Zmd60/src/state.jl:142 [inlined]
 [10] default_rng()
    @ CUDA.CURAND ~/.julia/packages/CUDA/Zmd60/lib/curand/CURAND.jl:32
 [11] rand(dim1::Int64, dims::Int64)
    @ CUDA ~/.julia/packages/CUDA/Zmd60/src/random.jl:70
 [12] top-level scope
    @ [...]/src/test.jl:2
in expression starting at [...]/src/test.jl:2
maleadt commented 3 years ago

Well this is absurd; a plain Float32-based GEMM with no special flags seems to be failing here. Could you list your CUDA.versioninfo()? The nvidia-smi output is truncated and I can't see which GPU you have.

The fact that your local CUDA toolkit 11.2 Update 1 doesn't work is expected; support for that version of CUDA only lives on the CUDA.jl master branch (so you could try ]add CUDA#master). Similarly, released versions of CUDA.jl don't have the necessary CUDNN artifacts for CUDA 11.2 yet, so it doesn't auto-select that version (unless you force it using environment variables, as you noticed).

cchan commented 3 years ago

Oh okay, thanks for the explanation!

Without setting any environment variables, this is what gets installed by default:

julia> CUDA.versioninfo()
CUDA toolkit 11.1.1, artifact installation
CUDA driver 11.3.0
NVIDIA driver 465.51.0

Libraries: 
- CUBLAS: 11.4.1
- CURAND: 10.2.2
- CUFFT: 10.3.0
- CUSOLVER: 11.0.1
- CUSPARSE: 11.3.0
- CUPTI: 14.0.0
- NVML: 11.0.0+465.0
- CUDNN: 8.0.4 (for CUDA 11.1.0)
- CUTENSOR: 1.2.1 (for CUDA 11.1.0)

Toolchain:
- Julia: 1.6.0-rc1
- LLVM: 11.0.1
- PTX ISA support: 3.2, 4.0, 4.1, 4.2, 4.3, 5.0, 6.0, 6.1, 6.3, 6.4, 6.5, 7.0
- Device support: sm_35, sm_37, sm_50, sm_52, sm_53, sm_60, sm_61, sm_62, sm_70, sm_72, sm_75, sm_80

1 device:
  0: NVIDIA GeForce RTX 2070 (sm_75, 5.745 GiB / 8.000 GiB available)

Setting JULIA_CUDA_VERSION=11.2 gives this working setup:

julia> CUDA.versioninfo()
CUDA toolkit 11.2.0, artifact installation
CUDA driver 11.3.0
NVIDIA driver 465.51.0

Libraries: 
- CUBLAS: 11.4.1
- CURAND: 10.2.3
- CUFFT: 10.4.0
- CUSOLVER: 11.0.2
- CUSPARSE: 11.3.1
- CUPTI: 14.0.0
- NVML: 11.0.0+465.0
- CUDNN: missing
- CUTENSOR: missing

Toolchain:
- Julia: 1.6.0-rc1
- LLVM: 11.0.1
- PTX ISA support: 3.2, 4.0, 4.1, 4.2, 4.3, 5.0, 6.0, 6.1, 6.3, 6.4, 6.5, 7.0
- Device support: sm_35, sm_37, sm_50, sm_52, sm_53, sm_60, sm_61, sm_62, sm_70, sm_72, sm_75, sm_80

Environment:
- JULIA_CUDA_VERSION: 11.2

1 device:
  0: NVIDIA GeForce RTX 2070 (sm_75, 5.745 GiB / 8.000 GiB available)

Interestingly, some of the libraries have different version numbers but CUBLAS is not one of them.

... even more interestingly the CUDNN and CUTENSOR are missing in the working setup lmao. Is it using the system-installed CUDNN/CUTENSOR in that case? That might explain it since I'm on driver 11.3.

maleadt commented 3 years ago

... even more interestingly the CUDNN and CUTENSOR are missing in the working setup lmao

That's what I meant with:

Similarly, released versions of CUDA.jl don't have the necessary CUDNN artifacts for CUDA 11.2 yet, so it doesn't auto-select that version (unless you force it using environment variables, as you noticed).

But yeah, it's funny that CUBLAS doesn't change between 11.1 and 11.2... That's not correct; what I get from the release notes is encoded here: https://github.com/JuliaGPU/CUDA.jl/blob/a34e69e7d8bc8d82f7e81559cbb6f059c5b57f88/deps/discovery.jl#L204-L231

And indeed I get:

$ JULIA_CUDA_VERSION=11.1 jl                                                                                                                                                                             [master] 
julia> using CUDA
C[ Info: Precompiling CUDA [052768ef-5323-5732-b1bb-66c8b64840ba]
UDA.versioninfo()

julia> CUDA.versioninfo()
  Downloaded artifact: CUDNN_CUDA111
  Downloaded artifact: CUTENSOR_CUDA111
CUDA toolkit 11.1.1, artifact installation
CUDA driver 11.2.0
NVIDIA driver 460.39.0

Libraries: 
- CUBLAS: 11.3.0
- CURAND: 10.2.2
- CUFFT: 10.3.0
- CUSOLVER: 11.0.1
- CUSPARSE: 11.3.0
- CUPTI: 14.0.0
- NVML: 11.0.0+460.39
- CUDNN: 8.10.0 (for CUDA 11.2.0)
- CUTENSOR: 1.2.2 (for CUDA 11.1.0)

I wonder if it's picking up libcublas from anywhere else. Could you @show CUDA.libcublas()? It should be a symlink to libcublas.so.11.3.0.106 from the artifact with hash 48c41dccb8db0c9aa9483267cb33719207abe4c1.

cchan commented 3 years ago

Ah that makes sense, I'm getting CUBLAS to work at the cost of no CUDNN/CUTENSOR availability.

And indeed libcublas is exactly as you say:

julia> @show CUDA.libcublas()
CUDA.libcublas() = "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcublas.so.11"
"/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcublas.so.11"
$ ls -la /home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcublas.so.11
lrwxrwxrwx 1 clive clive 23 Feb 18 17:43 /home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcublas.so.11 -> libcublas.so.11.3.0.106

And yet we still have CUBLAS: 11.4.1 :/

maleadt commented 3 years ago

Can you show the output of Libdl.dllist() after having queried the version?

cchan commented 3 years ago

edit: all 62 elements of the vector

It's picking up the right libcublas from the artifact, but libcublasLt is being loaded from the system toolkit in /usr/local/cuda instead?

julia> show(stdout, "text/plain",Libdl.dllist())
62-element Vector{String}:
 "linux-vdso.so.1"
 "/usr/lib/x86_64-linux-gnu/libdl.so.2"
 "/usr/lib/x86_64-linux-gnu/libpthread.so.0"
 "/usr/lib/x86_64-linux-gnu/libc.so.6"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/libjulia.so.1"
 "/lib64/ld-linux-x86-64.so.2"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libgcc_s.so.1"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libopenlibm.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libjulia-internal.so.1"
 "/usr/lib/x86_64-linux-gnu/libunwind.so.8"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libLLVM-11jl.so"
 "/usr/lib/x86_64-linux-gnu/librt.so.1"
 "/usr/lib/x86_64-linux-gnu/libstdc++.so.6"
 "/usr/lib/x86_64-linux-gnu/libm.so.6"
 "/usr/lib/x86_64-linux-gnu/liblzma.so.5"
 "/home/clive/packages/julias/julia-1.6/lib/julia/sys.so"
 "/usr/lib/x86_64-linux-gnu/libatomic.so.1"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libpcre2-8.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libgmp.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libmpfr.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libopenblas64_.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libgfortran.so.4"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libquadmath.so.0"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libcholmod.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libamd.so.2"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libcolamd.so.2"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libsuitesparseconfig.so.5"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libccolamd.so.2"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libcamd.so.2"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libsuitesparse_wrapper.so"
 "/usr/lib/x86_64-linux-gnu/libnghttp2.so.14"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libcurl.so"
 "/usr/lib/x86_64-linux-gnu/libssh2.so.1"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libmbedtls.so.13"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libmbedx509.so.1"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libmbedcrypto.so.5"
 "/usr/lib/x86_64-linux-gnu/libz.so.1"
 "/usr/lib/x86_64-linux-gnu/libgcrypt.so.20"
 "/usr/lib/x86_64-linux-gnu/libgpg-error.so.0"
 "/usr/lib/x86_64-linux-gnu/libgomp.so.1"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libdSFMT.so"
 "/mnt/c/Windows/System32/lxss/lib/libcuda.so.1"
 "/mnt/c/Windows/System32/lxss/lib/libdxcore.so"
 "/usr/lib/wsl/drivers/nv_dispi.inf_amd64_cc769de64b941e9c/libcuda.so.1.1"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcublas.so.11"
 "/usr/local/cuda/lib64/libcublasLt.so.11"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcusparse.so.11"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcusolver.so.11"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcufft.so.10"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcurand.so.10"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_ops_infer.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_ops_train.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_cnn_infer.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_cnn_train.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_adv_infer.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_adv_train.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn.so.8"
 "/home/clive/.julia/artifacts/ac25f8a4fc72584e696bd007b229fd2921b34062/lib/libcutensor.so.1"
 "/mnt/c/Windows/System32/lxss/lib/libnvidia-ml.so.1"
 "/usr/lib/wsl/drivers/nv_dispi.inf_amd64_cc769de64b941e9c/libnvidia-ml.so.1"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcupti.so.2020.2.1"
 "/usr/lib/x86_64-linux-gnu/libutil.so.1"
maleadt commented 3 years ago

"/usr/local/cuda/lib64/libcublasLt.so.11" being loaded isn't OK, that's probably why @jonathan-laurent has been seeing cublasLt-related symbol errors... What happens if you Libdl.dlopen("/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcublasLt.so.11") before loading CUDA and calling versioninfo()?

cchan commented 3 years ago

It works :)

julia> using Libdl

julia> Libdl.dlopen("/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcublasLt.so.11")
Ptr{Nothing} @0x00000000017f76a0

julia> using CUDA

julia> CUDA.versioninfo()
CUDA toolkit 11.1.1, artifact installation
CUDA driver 11.3.0
NVIDIA driver 465.51.0

Libraries: 
- CUBLAS: 11.3.0
- CURAND: 10.2.2
- CUFFT: 10.3.0
- CUSOLVER: 11.0.1
- CUSPARSE: 11.3.0
- CUPTI: 14.0.0
- NVML: 11.0.0+465.0
- CUDNN: 8.0.4 (for CUDA 11.1.0)
- CUTENSOR: 1.2.1 (for CUDA 11.1.0)

Toolchain:
- Julia: 1.6.0-rc1
- LLVM: 11.0.1
- PTX ISA support: 3.2, 4.0, 4.1, 4.2, 4.3, 5.0, 6.0, 6.1, 6.3, 6.4, 6.5, 7.0
- Device support: sm_35, sm_37, sm_50, sm_52, sm_53, sm_60, sm_61, sm_62, sm_70, sm_72, sm_75, sm_80

1 device:
  0: NVIDIA GeForce RTX 2070 (sm_75, 6.018 GiB / 8.000 GiB available)

julia> show(stdout, "text/plain", Libdl.dllist())
62-element Vector{String}:
 "linux-vdso.so.1"
 "/usr/lib/x86_64-linux-gnu/libdl.so.2"
 "/usr/lib/x86_64-linux-gnu/libpthread.so.0"
 "/usr/lib/x86_64-linux-gnu/libc.so.6"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/libjulia.so.1"
 "/lib64/ld-linux-x86-64.so.2"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libgcc_s.so.1"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libopenlibm.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libjulia-internal.so.1"
 "/usr/lib/x86_64-linux-gnu/libunwind.so.8"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libLLVM-11jl.so"
 "/usr/lib/x86_64-linux-gnu/librt.so.1"
 "/usr/lib/x86_64-linux-gnu/libstdc++.so.6"
 "/usr/lib/x86_64-linux-gnu/libm.so.6"
 "/usr/lib/x86_64-linux-gnu/liblzma.so.5"
 "/home/clive/packages/julias/julia-1.6/lib/julia/sys.so"
 "/usr/lib/x86_64-linux-gnu/libatomic.so.1"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libpcre2-8.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libgmp.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libmpfr.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libopenblas64_.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libgfortran.so.4"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libquadmath.so.0"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libcholmod.so"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libamd.so.2"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libcolamd.so.2"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libsuitesparseconfig.so.5"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libccolamd.so.2"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libcamd.so.2"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libsuitesparse_wrapper.so"
 "/usr/lib/x86_64-linux-gnu/libnghttp2.so.14"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libcurl.so"
 "/usr/lib/x86_64-linux-gnu/libssh2.so.1"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libmbedtls.so.13"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libmbedx509.so.1"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libmbedcrypto.so.5"
 "/usr/lib/x86_64-linux-gnu/libz.so.1"
 "/usr/lib/x86_64-linux-gnu/libgcrypt.so.20"
 "/usr/lib/x86_64-linux-gnu/libgpg-error.so.0"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcublasLt.so.11"
 "/usr/lib/x86_64-linux-gnu/libgomp.so.1"
 "/home/clive/packages/julias/julia-1.6/bin/../lib/julia/libdSFMT.so"
 "/mnt/c/Windows/System32/lxss/lib/libcuda.so.1"
 "/mnt/c/Windows/System32/lxss/lib/libdxcore.so"
 "/usr/lib/wsl/drivers/nv_dispi.inf_amd64_cc769de64b941e9c/libcuda.so.1.1"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcublas.so.11"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcusparse.so.11"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcusolver.so.11"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcufft.so.10"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcurand.so.10"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_ops_infer.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_ops_train.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_cnn_infer.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_cnn_train.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_adv_infer.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn_adv_train.so.8"
 "/home/clive/.julia/artifacts/c1f953962cc13e4a55f7b2333fb212e7f5c08817/lib/libcudnn.so.8"
 "/home/clive/.julia/artifacts/ac25f8a4fc72584e696bd007b229fd2921b34062/lib/libcutensor.so.1"
 "/mnt/c/Windows/System32/lxss/lib/libnvidia-ml.so.1"
 "/usr/lib/wsl/drivers/nv_dispi.inf_amd64_cc769de64b941e9c/libnvidia-ml.so.1"
 "/home/clive/.julia/artifacts/48c41dccb8db0c9aa9483267cb33719207abe4c1/lib/libcupti.so.2020.2.1"
 "/usr/lib/x86_64-linux-gnu/libutil.so.1"

julia> a = CUDA.rand(2,2)
2×2 CuArray{Float32, 2}:
 0.608778  0.680285
 0.60226   0.923604

julia> b = CUDA.rand(2,2)
2×2 CuArray{Float32, 2}:
 0.40192   0.874944
 0.537889  0.7374

julia> a * b
2×2 CuArray{Float32, 2}:
 0.610598  1.03429
 0.738857  1.20801
maleadt commented 3 years ago

Thanks for the confirmation, I've pushed a similar fix here: https://github.com/JuliaGPU/CUDA.jl/pull/729. Could you please test?

cchan commented 3 years ago

Probably a dumb question, but how do I test this at the head of the repo? Running `update CUDA` didn't seem to have an effect.

jonathan-laurent commented 3 years ago

@cchan You probably want to do `]add CUDA#master`.

cchan commented 3 years ago

Ah, works great now 😋 Specifically, since it seems like 11.2 is now the default if it's available, creating arrays and multiplying on 11.2 works fine by default; besides that, switching to 11.1 using ENV also works fine.