monolish  0.17.3-dev.23
MONOlithic LInear equation Solvers for Highly-parallel architecture
monolish_tensor_dense.hpp
Go to the documentation of this file.
1 #pragma once
2 #include "monolish_matrix.hpp"
3 #include "monolish_tensor.hpp"
4 #include "monolish_vector.hpp"
5 
6 namespace monolish {
7 template <typename Float> class vector;
8 template <typename TYPE, typename Float> class view1D;
9 template <typename TYPE, typename Float> class view_Dense;
10 template <typename TYPE, typename Float> class view_tensor_Dense;
11 namespace tensor {
12 template <typename Float> class tensor_COO;
13 template <typename Float> class tensor_Dense {
14 private:
18  std::vector<size_t> shape;
19 
23  mutable std::shared_ptr<bool> gpu_status = std::make_shared<bool>(false);
24 
28  size_t first = 0;
29 
30 public:
34  std::shared_ptr<Float> val;
35 
39  size_t val_nnz = 0;
40 
44  size_t alloc_nnz = 0;
45 
49  bool val_create_flag = false;
50 
52 
62 
76 
86 
96  convert(tens);
97  val_create_flag = true;
98  }
99 
107  void convert(const matrix::Dense<Float> &dense);
108 
117  convert(dense);
118  val_create_flag = true;
119  }
120 
128  void convert(const vector<Float> &vec);
129 
138  convert(vec);
139  val_create_flag = true;
140  }
141 
150  tensor_Dense(const std::vector<size_t> &shape);
151 
160  tensor_Dense(const std::initializer_list<size_t> &shape);
161 
170  tensor_Dense(const std::vector<size_t> &shape, const Float *value);
171 
181  tensor_Dense(const std::vector<size_t> &shape,
182  const std::vector<Float> &value);
183 
194  tensor_Dense(const std::vector<size_t> &shape, const Float min,
195  const Float max);
196 
208  tensor_Dense(const std::vector<size_t> &shape, const Float min,
209  const Float max, const std::uint32_t seed);
210 
224  tensor_Dense(const tensor_Dense<Float> &tens, Float value);
225 
239 
253 
267  const view_tensor_Dense<tensor::tensor_Dense<Float>, Float> &tens);
268 
278  void set_ptr(const std::vector<size_t> &shape,
279  const std::vector<Float> &value);
280 
290  void set_ptr(const std::vector<size_t> &shape, const Float *value);
291 
301  void set_ptr(const std::vector<size_t> &shape, const Float value);
302 
310  [[nodiscard]] std::vector<size_t> get_shape() const { return shape; }
311 
319  [[nodiscard]] std::shared_ptr<Float> get_val() { return val; }
320 
328  [[nodiscard]] size_t get_nnz() const { return val_nnz; }
329 
337  [[nodiscard]] size_t get_alloc_nnz() const { return alloc_nnz; }
338 
345  [[nodiscard]] size_t get_first() const { return first; }
346 
353  [[nodiscard]] size_t get_offset() const { return get_first(); }
354 
362  void set_shape(const std::vector<size_t> &shape) { this->shape = shape; };
363 
371  // void set_nnz(const size_t NZ) { val_nnz = NZ; };
372 
378  void set_first(size_t i) { first = i; }
379 
387  [[nodiscard]] std::string type() const { return "tensor_Dense"; }
388 
389  // TODO
397  [[nodiscard]] double get_data_size() const {
398  return get_nnz() * sizeof(Float) / 1.0e+9;
399  }
400 
410  [[nodiscard]] Float at(const size_t pos) const;
411 
421  [[nodiscard]] Float at(const std::vector<size_t> &pos) const;
422 
432  template <typename... Args>
433  [[nodiscard]] Float at(const std::vector<size_t> &pos, const size_t dim,
434  const Args... args) const {
435  std::vector<size_t> pos_copy = pos;
436  pos_copy.push_back(dim);
437  return this->at(pos_copy, args...);
438  };
439 
449  template <typename... Args>
450 #if !defined(__clang__) && defined(__GNUC__)
451  [[nodiscard]] Float at(const size_t dim, const size_t dim2,
452  const Args... args) const {
453  std::vector<size_t> pos(1);
454  pos[0] = dim;
455  return this->at(pos, dim2, args...);
456  };
457 #else
458  [[nodiscard]] Float at(const size_t dim, const Args... args) const {
459  std::vector<size_t> pos(1);
460  pos[0] = dim;
461  return this->at(pos, args...);
462  };
463 #endif
464 
474  [[nodiscard]] Float at(const size_t pos) {
475  return static_cast<const tensor_Dense *>(this)->at(pos);
476  };
477 
487  [[nodiscard]] Float at(const std::vector<size_t> &pos) {
488  return static_cast<const tensor_Dense *>(this)->at(pos);
489  };
490 
500  template <typename... Args>
501  [[nodiscard]] Float at(const std::vector<size_t> &pos, const Args... args) {
502  return static_cast<const tensor_Dense *>(this)->at(pos, args...);
503  };
504 
514  template <typename... Args>
515  [[nodiscard]] Float at(const size_t dim, const Args... args) {
516  return static_cast<const tensor_Dense *>(this)->at(dim, args...);
517  };
518 
528  void insert(const size_t pos, const Float Val);
529 
539  void insert(const std::vector<size_t> &pos, const Float Val);
540 
549  void print_all(bool force_cpu = false) const;
550 
551  // communication
552  // ///////////////////////////////////////////////////////////////////////////
560  void send() const;
561 
569  void recv();
570 
578  void nonfree_recv();
579 
587  void device_free() const;
588 
593  [[nodiscard]] bool get_device_mem_stat() const { return *gpu_status; }
594 
599  [[nodiscard]] std::shared_ptr<bool> get_gpu_status() const {
600  return gpu_status;
601  }
602 
611  if (val_create_flag) {
612  if (get_device_mem_stat()) {
613  device_free();
614  }
615  }
616  }
617 
624  [[nodiscard]] const Float *data() const { return val.get(); }
625 
632  [[nodiscard]] Float *data() { return val.get(); }
633 
642  void resize(const size_t N, Float Val = 0) {
643  if (first + N < alloc_nnz) {
644  for (size_t i = val_nnz; i < N; ++i) {
645  begin()[i] = Val;
646  }
647  val_nnz = N;
648  return;
649  }
650  if (get_device_mem_stat()) {
651  throw std::runtime_error("Error, GPU matrix cant use resize");
652  }
653  if (val_create_flag) {
654  std::shared_ptr<Float> tmp(new Float[N], std::default_delete<Float[]>());
655  size_t copy_size = std::min(val_nnz, N);
656  for (size_t i = 0; i < copy_size; ++i) {
657  tmp.get()[i] = data()[i];
658  }
659  for (size_t i = copy_size; i < N; ++i) {
660  tmp.get()[i] = Val;
661  }
662  val = tmp;
663  alloc_nnz = N;
664  val_nnz = N;
665  first = 0;
666  } else {
667  throw std::runtime_error("Error, not create vector cant use resize");
668  }
669  }
670 
679  void resize(const std::vector<size_t> &shape, Float val = 0) {
680  size_t N = 1;
681  for (auto n : shape) {
682  N *= n;
683  }
684  resize(N, val);
685  this->shape = shape;
686  }
687 
693  void move(const matrix::Dense<Float> &dense);
694 
700  void move(const vector<Float> &vec);
701 
708  [[nodiscard]] const Float *begin() const { return data() + get_offset(); }
709 
716  [[nodiscard]] Float *begin() { return data() + get_offset(); }
717 
724  [[nodiscard]] const Float *end() const {
725  return data() + get_offset() + get_nnz();
726  }
727 
734  [[nodiscard]] Float *end() { return data() + get_offset() + get_nnz(); }
735 
744  void fill(Float value);
745 
758  void operator=(const tensor_Dense<Float> &tens);
759 
772  void operator=(const view_tensor_Dense<vector<Float>, Float> &tens);
773 
787 
800  void
802 
812  [[nodiscard]] Float &operator[](size_t i) {
813  if (get_device_mem_stat()) {
814  throw std::runtime_error("Error, GPU vector cant use operator[]");
815  }
816  return data()[first + i];
817  }
818 
829  [[nodiscard]] bool equal(const tensor_Dense<Float> &tens,
830  bool compare_cpu_and_device = false) const;
831 
843  [[nodiscard]] bool operator==(const tensor_Dense<Float> &tens) const;
844 
856  [[nodiscard]] bool operator!=(const tensor_Dense<Float> &tens) const;
857 
867  size_t get_index(const std::vector<size_t> &pos) const {
868  if (pos.size() != this->shape.size()) {
869  throw std::runtime_error("pos size should be same with the shape");
870  }
871  size_t ind = 0;
872  for (auto i = 0; i < pos.size(); ++i) {
873  ind *= this->shape[i];
874  ind += pos[i];
875  }
876  return ind;
877  }
878 
888  std::vector<size_t> get_index(const size_t pos) const {
889  std::vector<size_t> ind(this->shape.size(), 0);
890  auto pos_copy = pos;
891  for (int i = (int)this->shape.size() - 1; i >= 0; --i) {
892  ind[i] = pos_copy % this->shape[i];
893  pos_copy /= this->shape[i];
894  }
895  return ind;
896  }
897 
906  void reshape(const std::vector<int> &shape);
907 
916  template <typename... Args>
917  void reshape(const std::vector<int> &shape, const size_t dim,
918  const Args... args) {
919  std::vector<int> shape_copy = shape;
920  shape_copy.push_back(dim);
921  reshape(shape_copy, args...);
922  return;
923  }
924 
933  template <typename... Args> void reshape(const int dim, const Args... args) {
934  std::vector<int> shape(1);
935  shape[0] = dim;
936  reshape(shape, args...);
937  return;
938  }
939 
941 
950  void diag_add(const Float alpha);
951 
960  void diag_sub(const Float alpha);
961 
970  void diag_mul(const Float alpha);
971 
980  void diag_div(const Float alpha);
981 
990  void diag_add(const vector<Float> &vec);
991  void diag_add(const view1D<vector<Float>, Float> &vec);
992  void diag_add(const view1D<matrix::Dense<Float>, Float> &vec);
993  void diag_add(const view1D<tensor::tensor_Dense<Float>, Float> &vec);
994 
1003  void diag_sub(const vector<Float> &vec);
1004  void diag_sub(const view1D<vector<Float>, Float> &vec);
1005  void diag_sub(const view1D<matrix::Dense<Float>, Float> &vec);
1006  void diag_sub(const view1D<tensor::tensor_Dense<Float>, Float> &vec);
1007 
1016  void diag_mul(const vector<Float> &vec);
1017  void diag_mul(const view1D<vector<Float>, Float> &vec);
1018  void diag_mul(const view1D<matrix::Dense<Float>, Float> &vec);
1019  void diag_mul(const view1D<tensor::tensor_Dense<Float>, Float> &vec);
1020 
1029  void diag_div(const vector<Float> &vec);
1030  void diag_div(const view1D<vector<Float>, Float> &vec);
1031  void diag_div(const view1D<matrix::Dense<Float>, Float> &vec);
1032  void diag_div(const view1D<tensor::tensor_Dense<Float>, Float> &vec);
1033 };
1034 } // namespace tensor
1035 } // namespace monolish
Dense format Matrix.
void reshape(const std::vector< int > &shape)
Reshape tensor.
bool equal(const tensor_Dense< Float > &tens, bool compare_cpu_and_device=false) const
Comparing tensors (A == tens)
void reshape(const std::vector< int > &shape, const size_t dim, const Args... args)
Reshape tensor.
std::vector< size_t > get_index(const size_t pos) const
get vector index from aligned index (A[pos[0]][pos[1]]... = A[ind])
std::string type() const
get format name "tensor_Dense"
void diag_mul(const vector< Float > &vec)
Vector and diag. vector of Dense format matrix mul.
size_t get_index(const std::vector< size_t > &pos) const
get aligned index from vector index (A[pos] = A[ind[0]][ind[1]]...)
void convert(const matrix::Dense< Float > &dense)
create tensor_Dense tensor from Dense matrix
void diag_add(const view1D< matrix::Dense< Float >, Float > &vec)
tensor_Dense(const std::initializer_list< size_t > &shape)
Allocate dense tensor.
size_t get_first() const
get first position
bool operator!=(const tensor_Dense< Float > &tens) const
Comparing tensors (A != tens)
void diag_div(const view1D< tensor::tensor_Dense< Float >, Float > &vec)
tensor_Dense(const view_tensor_Dense< vector< Float >, Float > &tens)
Create Dense matrix from view Dense matrix.
void operator=(const view_tensor_Dense< tensor::tensor_Dense< Float >, Float > &tens)
tensor copy
std::vector< size_t > shape
shape
tensor_Dense(const std::vector< size_t > &shape, const std::vector< Float > &value)
Allocate tensor_Dense tensor.
void set_ptr(const std::vector< size_t > &shape, const Float value)
Set tensor_Dense array from array.
std::shared_ptr< Float > val
Dense tensor format value (pointer)
Float at(const std::vector< size_t > &pos, const Args... args)
get element A[pos[0]][pos[1]]... (onlu CPU)
void insert(const size_t pos, const Float Val)
set element A[index]...
Float at(const std::vector< size_t > &pos)
get element A[pos[0]][pos[1]]... (onlu CPU)
void operator=(const view_tensor_Dense< matrix::Dense< Float >, Float > &tens)
tensor copy
void diag_add(const Float alpha)
Scalar and diag. vector of Dense format matrix add.
void insert(const std::vector< size_t > &pos, const Float Val)
set element A[pos[0]][pos[1]]...
void recv()
recv. data to GPU, and free data on GPU
void send() const
send data to GPU
void diag_sub(const view1D< tensor::tensor_Dense< Float >, Float > &vec)
void diag_sub(const view1D< matrix::Dense< Float >, Float > &vec)
size_t val_nnz
# of non-zero element (M * N)
tensor_Dense(const matrix::Dense< Float > &dense)
Create tensor_Dense tensor from Dense matrix.
void diag_add(const view1D< vector< Float >, Float > &vec)
std::vector< size_t > get_shape() const
get shape
void diag_add(const view1D< tensor::tensor_Dense< Float >, Float > &vec)
void print_all(bool force_cpu=false) const
print all elements to standard I/O
void diag_sub(const view1D< vector< Float >, Float > &vec)
size_t alloc_nnz
allocated tensor size
void resize(const std::vector< size_t > &shape, Float val=0)
resize tensor value
void fill(Float value)
fill tensor elements with a scalar value
Float at(const size_t dim, const Args... args) const
get element A[pos[0]][pos[1]]...
size_t first
first position of data array
std::shared_ptr< bool > gpu_status
true: sended, false: not send
tensor_Dense(const tensor::tensor_Dense< Float > &tens)
Create tensor_Dense tensor from tensor_Dense tensor.
Float at(const std::vector< size_t > &pos) const
get element A[pos[0]][pos[1]]...
void move(const matrix::Dense< Float > &dense)
move tensor_Dense tensor from Dense matrix
std::shared_ptr< Float > get_val()
get shared_ptr of val
Float * end()
returns a end iterator
void diag_div(const view1D< matrix::Dense< Float >, Float > &vec)
void diag_add(const vector< Float > &vec)
Vector and diag. vector of Dense format matrix add.
Float * data()
returns a direct pointer to the tensor
void diag_mul(const view1D< tensor::tensor_Dense< Float >, Float > &vec)
void nonfree_recv()
recv. data to GPU (w/o free)
void diag_mul(const view1D< matrix::Dense< Float >, Float > &vec)
const Float * data() const
returns a direct pointer to the tensor
Float at(const size_t pos)
get element A[index]... (onlu CPU)
Float at(const std::vector< size_t > &pos, const size_t dim, const Args... args) const
get element A[pos[0]][pos[1]]...
void set_shape(const std::vector< size_t > &shape)
Set shape.
tensor_Dense(const std::vector< size_t > &shape, const Float min, const Float max)
Allocate tensor_Dense tensor.
const Float * end() const
returns a end iterator
bool val_create_flag
tensor create flag
void diag_div(const Float alpha)
Scalar and diag. vector of Dense format matrix div.
void set_first(size_t i)
Set # of non-zero elements.
size_t get_alloc_nnz() const
get # of alloced non-zeros
void move(const vector< Float > &vec)
move tensor_Dense tensor from vector
void convert(const tensor::tensor_COO< Float > &tens)
Create tensor_Dense tensor from tensor_COO tensor.
size_t get_nnz() const
get # of non-zeros
tensor_Dense(const std::vector< size_t > &shape, const Float min, const Float max, const std::uint32_t seed)
Allocate tensor_Dense tensor.
void diag_sub(const vector< Float > &vec)
Vector and diag. vector of Dense format matrix sub.
tensor_Dense(const view_tensor_Dense< tensor::tensor_Dense< Float >, Float > &tens)
Create Dense matrix from view Dense matrix.
const Float * begin() const
returns a begin iterator
tensor_Dense(const std::vector< size_t > &shape, const Float *value)
Allocate dense tensor.
Float & operator[](size_t i)
reference to the element at position (v[i])
tensor_Dense(const view_tensor_Dense< matrix::Dense< Float >, Float > &tens)
Create Dense matrix from view Dense matrix.
void diag_sub(const Float alpha)
Scalar and diag. vector of Dense format matrix sub.
tensor_Dense(const tensor::tensor_COO< Float > &tens)
Create tensor_Dense tensor from tensor_COO tensor.
tensor_Dense(const vector< Float > &vec)
create tensor_Dense tensor from vector
void convert(const vector< Float > &vec)
create tensor_Dense tensor from vector
void set_ptr(const std::vector< size_t > &shape, const Float *value)
Set tensor_Dense array from array.
void operator=(const tensor_Dense< Float > &tens)
tensor copy
void device_free() const
free data on GPU
Float at(const size_t dim, const Args... args)
get element A[pos[0]][pos[1]]... (onlu CPU)
void set_ptr(const std::vector< size_t > &shape, const std::vector< Float > &value)
Set tensor_Dense array from std::vector.
void reshape(const int dim, const Args... args)
Reshape tensor.
Float * begin()
returns a begin iterator
Float at(const size_t pos) const
get element A[index]...
double get_data_size() const
Memory data space required by the matrix.
void resize(const size_t N, Float Val=0)
resize tensor value
~tensor_Dense()
destructor of dense tensor, free GPU memory
std::shared_ptr< bool > get_gpu_status() const
gpu status shared pointer
tensor_Dense(const tensor_Dense< Float > &tens, Float value)
Create tensor_Dense tensor of the same size as input tensor.
void diag_mul(const Float alpha)
Scalar and diag. vector of Dense format matrix mul.
void diag_div(const view1D< vector< Float >, Float > &vec)
void operator=(const view_tensor_Dense< vector< Float >, Float > &tens)
tensor copy
bool operator==(const tensor_Dense< Float > &tens) const
Comparing tensors (A == tens)
void diag_div(const vector< Float > &vec)
Vector and diag. vector of Dense format matrix div.
bool get_device_mem_stat() const
true: sended, false: not send
size_t get_offset() const
get first position (same as get_first())
tensor_Dense(const std::vector< size_t > &shape)
Allocate dense tensor.
void diag_mul(const view1D< vector< Float >, Float > &vec)
void convert(const tensor::tensor_Dense< Float > &tens)
Create tensor_Dense tensor from tensor_Dense tensor.
void max(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
Create a new CRS matrix with greatest elements of two matrices (C[0:nnz] = max(A[0:nnz],...
void min(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
Create a new CRS matrix with smallest elements of two matrices (C[0:nnz] = min(A[0:nnz],...
monolish namespaces