// Copyright (C) 2017 Davis E. King ([email protected]) | |
// License: Boost Software License See LICENSE.txt for the full license. | |
namespace dlib | |
{ | |
namespace cuda | |
{ | |
// ----------------------------------------------------------------------------------- | |
class inv : noncopyable | |
{ | |
/*! | |
WHAT THIS OBJECT REPRESENTS | |
This is a functor for doing matrix inversion on the GPU. The only | |
reason it's an object is to avoid the reallocation of some GPU memory | |
blocks if you want to do a bunch of matrix inversions in a row. | |
!*/ | |
public: | |
inv() = default; | |
~inv(); | |
void operator() ( | |
const tensor& m, | |
resizable_tensor& out | |
); | |
/*! | |
requires | |
- m.size() == m.num_samples()*m.num_samples() | |
(i.e. mat(m) must be a square matrix) | |
ensures | |
- out == inv(mat(m)); | |
!*/ | |
int get_last_status( | |
); | |
/*! | |
ensures | |
- returns 0 if the last matrix inversion was successful and != 0 | |
otherwise. | |
!*/ | |
private: | |
void sync_if_needed(); | |
bool did_work_lately = false; | |
resizable_tensor m; | |
cuda_data_ptr<float> workspace; | |
cuda_data_ptr<int> Ipiv; | |
cuda_data_ptr<int> info; | |
}; | |
// ------------------------------------------------------------------------------------ | |
} | |
} | |