/external/tensorflow/tensorflow/stream_executor/ |
blas.cc | 16 #include "tensorflow/stream_executor/blas.h" 22 namespace blas { namespace in namespace:perftools::gputools 91 } // namespace blas
|
plugin.h | 51 // described therein will be used to provide BLAS, DNN, FFT, and RNG 72 PluginConfig& SetBlas(PluginId blas); 77 PluginId blas() const { return blas_; } function in class:perftools::gputools::PluginConfig
|
plugin_registry.h | 21 #include "tensorflow/stream_executor/blas.h" 40 // BLAS, DNN, FFT, and RNG. Each interface is defined in the corresponding 53 typedef blas::BlasSupport* (*BlasFactory)(internal::StreamExecutorInterface*); 107 std::map<PluginId, BlasFactory> blas; member in struct:perftools::gputools::PluginRegistry::PluginFactories 117 PluginId blas, dnn, fft, rng; member in struct:perftools::gputools::PluginRegistry::DefaultFactories
|
blas.h | 16 // Exposes the family of BLAS routines as pre-canned high performance calls for 22 // This abstraction makes it simple to entrain BLAS operations on GPU data into 37 // kernel launches (via StreamExecutor::ThenLaunch()) with these pre-canned BLAS 61 namespace blas { namespace in namespace:perftools::gputools 64 // transposed+conjugated before any BLAS operations. 90 // Type with which intermediate computations of a blas routine are performed. 92 // Some blas calls can perform computations with a type that's different than 107 // Opaque identifier for an "algorithm" used by a blas routine. This functions 108 // as a hint to the blas library. 115 // blas uses -1 to represent the default algorithm. This happens to match u [all...] |
/cts/tests/tests/rsblas/src/android/renderscript/cts/ |
BNNMTest.java | 145 ScriptIntrinsicBLAS blas = ScriptIntrinsicBLAS.create(mRS); local 146 blas.BNNM(A, a_offset, B, b_offset, C, c_offset, c_mult_int); 463 ScriptIntrinsicBLAS blas = ScriptIntrinsicBLAS.create(mRS); local 467 blas.BNNM(A, a_offset, B, b_offset, C, c_offset, c_mult_int); 474 blas.BNNM(A, a_offset, B, b_offset, C, c_offset, c_mult_int); 481 blas.BNNM(A, a_offset, B, b_offset, C, c_offset, c_mult_int); 488 blas.BNNM(A, a_offset, B, b_offset, C, c_offset, c_mult_int); 495 blas.BNNM(A, a_offset, B, b_offset, C, c_offset, c_mult_int);
|