monolish  0.17.3-dev.23
MONOlithic LInear equation Solvers for Highly-parallel architecture
monolish_vector.hpp
Go to the documentation of this file.
1 #pragma once
2 #include "./monolish_dense.hpp"
3 #include "./monolish_logger.hpp"
4 #include "./monolish_view1D.hpp"
5 #include <exception>
6 #include <fstream>
7 #include <iostream>
8 #include <iterator>
9 #include <memory>
10 #include <omp.h>
11 #include <stdexcept>
12 #include <string>
13 #include <vector>
14 
15 #if USE_SXAT
16 #undef _HAS_CPP17
17 #endif
18 #include <random>
19 #if USE_SXAT
20 #define _HAS_CPP17 1
21 #endif
22 
23 #if defined USE_MPI
24 #include <mpi.h>
25 #endif
26 
27 namespace monolish {
28 template <typename TYPE, typename Float> class view1D;
29 template <typename TYPE, typename Float> class view_Dense;
30 template <typename TYPE, typename Float> class view_tensor_Dense;
31 
32 namespace tensor {
33 template <typename Float> class tensor_Dense;
34 }
35 
47 template <typename Float> class vector {
48 private:
52  mutable std::shared_ptr<bool> gpu_status = std::make_shared<bool>(false);
53 
57  size_t first = 0;
58 
59 public:
63  std::shared_ptr<Float> val;
64 
68  std::size_t val_nnz = 0;
69 
73  std::size_t alloc_nnz = 0;
74 
78  bool val_create_flag = false;
79 
80  vector() { val_create_flag = true; }
81 
82  // constructor ///////////////////////////////////////////////////////
91  vector(const size_t N);
92 
102  vector(const size_t N, const Float value);
103 
112  vector(const std::vector<Float> &vec);
113 
122  vector(const std::initializer_list<Float> &list);
123 
136  vector(const vector<Float> &vec);
137 
150  vector(const view1D<vector<Float>, Float> &vec);
151 
164  vector(const view1D<matrix::Dense<Float>, Float> &vec);
165 
179 
189  vector(const Float *start, const Float *end);
190 
201  vector(const size_t N, const Float min, const Float max);
202 
215  vector(const size_t N, const Float min, const Float max,
216  const std::uint32_t seed);
217 
225  [[nodiscard]] std::string type() const { return "vector"; }
226 
227  // communication
228  // ///////////////////////////////////////////////////////////////////////////
236  void send() const;
237 
245  void recv();
246 
254  void nonfree_recv();
255 
263  void device_free() const;
264 
273  [[nodiscard]] bool get_device_mem_stat() const { return *gpu_status; }
274 
279  [[nodiscard]] std::shared_ptr<bool> get_gpu_status() const {
280  return gpu_status;
281  }
282 
291  if (val_create_flag) {
292  if (get_device_mem_stat()) {
293  device_free();
294  }
295  }
296  }
297 
298  // util
299  // ///////////////////////////////////////////////////////////////////////////
300 
307  [[nodiscard]] const Float *data() const { return val.get(); }
308 
315  [[nodiscard]] Float *data() { return val.get(); }
316 
323  [[nodiscard]] const Float *begin() const { return data() + get_offset(); }
324 
331  [[nodiscard]] Float *begin() { return data() + get_offset(); }
332 
339  [[nodiscard]] const Float *end() const {
340  return data() + get_offset() + get_nnz();
341  }
342 
349  [[nodiscard]] Float *end() { return data() + get_offset() + get_nnz(); }
350 
357  [[nodiscard]] size_t size() const { return val_nnz; }
358 
366  [[nodiscard]] std::shared_ptr<Float> get_val() { return val; }
367 
374  [[nodiscard]] size_t get_nnz() const { return val_nnz; }
375 
383  [[nodiscard]] size_t get_alloc_nnz() const { return alloc_nnz; }
384 
391  [[nodiscard]] size_t get_first() const { return first; }
392 
399  [[nodiscard]] size_t get_offset() const { return get_first(); }
400 
406  void set_first(size_t i) { first = i; }
407 
416  void fill(Float value);
417 
426  void print_all(bool force_cpu = false) const;
427 
436  void print_all(std::string filename) const;
437 
446  void resize(size_t N, Float Val = 0) {
447  if (get_device_mem_stat()) {
448  throw std::runtime_error("Error, GPU vector cant use resize");
449  }
450  if (val_create_flag) {
451  std::shared_ptr<Float> tmp(new Float[N], std::default_delete<Float[]>());
452  size_t copy_size = std::min(val_nnz, N);
453  for (size_t i = 0; i < copy_size; i++) {
454  tmp.get()[i] = data()[i];
455  }
456  for (size_t i = copy_size; i < N; i++) {
457  tmp.get()[i] = Val;
458  }
459  val = tmp;
460  alloc_nnz = N;
461  val_nnz = N;
462  } else {
463  throw std::runtime_error("Error, not create vector cant use resize");
464  }
465  }
466 
473  void push_back(Float Val) {
474  if (get_device_mem_stat()) {
475  throw std::runtime_error("Error, GPU vector cant use push_back");
476  }
477  if (val_create_flag) {
478  if (val_nnz >= alloc_nnz) {
479  size_t tmp = val_nnz;
480  alloc_nnz = 2 * alloc_nnz + 1;
481  resize(alloc_nnz);
482  val_nnz = tmp;
483  }
484  data()[val_nnz] = Val;
485  val_nnz++;
486  } else {
487  throw std::runtime_error("Error, not create vector cant use push_back");
488  }
489  }
490 
491  void move(const tensor::tensor_Dense<Float> &tensor_dense);
492 
493  void move(const tensor::tensor_Dense<Float> &tensor_dense, int N);
494 
495  void move(const view_tensor_Dense<vector<Float>, Float> &tensor_dense);
496 
497  void move(const view_tensor_Dense<matrix::Dense<Float>, Float> &tensor_dense);
498 
500  &tensor_dense);
501 
502  void move(const view_tensor_Dense<vector<Float>, Float> &tensor_dense, int N);
503 
504  void move(const view_tensor_Dense<matrix::Dense<Float>, Float> &tensor_dense,
505  int N);
506 
507  void move(
508  const view_tensor_Dense<tensor::tensor_Dense<Float>, Float> &tensor_dense,
509  int N);
510 
511  // operator
512  // ///////////////////////////////////////////////////////////////////////////
513 
526  void operator=(const vector<Float> &vec);
527 
540  void operator=(const view1D<vector<Float>, Float> &vec);
541 
554  void operator=(const view1D<matrix::Dense<Float>, Float> &vec);
555 
568  void operator=(const view1D<tensor::tensor_Dense<Float>, Float> &vec);
569 
579  void operator=(const std::vector<Float> &vec);
580 
589  [[nodiscard]] vector<Float> operator-();
590 
600  [[nodiscard]] Float &operator[](size_t i) {
601  if (get_device_mem_stat()) {
602  throw std::runtime_error("Error, GPU vector cant use operator[]");
603  }
604  return data()[first + i];
605  }
606 
617  bool equal(const vector<Float> &vec,
618  bool compare_cpu_and_device = false) const;
619 
630  bool equal(const view1D<vector<Float>, Float> &vec,
631  bool compare_cpu_and_device = false) const;
632 
643  bool equal(const view1D<matrix::Dense<Float>, Float> &vec,
644  bool compare_cpu_and_device = false) const;
645 
656  bool equal(const view1D<tensor::tensor_Dense<Float>, Float> &vec,
657  bool compare_cpu_and_device = false) const;
658 
670  bool operator==(const vector<Float> &vec) const;
671 
683  bool operator==(const view1D<vector<Float>, Float> &vec) const;
684 
696  bool operator==(const view1D<matrix::Dense<Float>, Float> &vec) const;
697 
709  bool operator==(const view1D<tensor::tensor_Dense<Float>, Float> &vec) const;
710 
722  bool operator!=(const vector<Float> &vec) const;
723 
735  bool operator!=(const view1D<vector<Float>, Float> &vec) const;
736 
748  bool operator!=(const view1D<matrix::Dense<Float>, Float> &vec) const;
749 
761  bool operator!=(const view1D<tensor::tensor_Dense<Float>, Float> &vec) const;
762 };
764 } // namespace monolish
Dense format Matrix.
vector(const view1D< matrix::Dense< Float >, Float > &vec)
copy from monolish::view1D from monolish::matrix::Dense
void set_first(size_t i)
change first position
void send() const
send data to GPU
Float & operator[](size_t i)
reference to the element at position (v[i])
vector(const size_t N, const Float min, const Float max, const std::uint32_t seed)
create N length rand(min~max) vector with random seed
void operator=(const std::vector< Float > &vec)
copy vector from std::vector
void resize(size_t N, Float Val=0)
resize vector (only CPU)
void move(const view_tensor_Dense< tensor::tensor_Dense< Float >, Float > &tensor_dense, int N)
vector(const std::vector< Float > &vec)
copy from std::vector
void operator=(const vector< Float > &vec)
copy vector, It is same as copy ( Copy the memory on CPU and GPU )
void move(const tensor::tensor_Dense< Float > &tensor_dense, int N)
void move(const view_tensor_Dense< vector< Float >, Float > &tensor_dense)
bool operator!=(const vector< Float > &vec) const
Comparing vectors (v != vec)
void move(const tensor::tensor_Dense< Float > &tensor_dense)
bool operator==(const view1D< vector< Float >, Float > &vec) const
Comparing vectors (v == vec)
void recv()
recv data from GPU, and free data on GPU
void operator=(const view1D< tensor::tensor_Dense< Float >, Float > &vec)
copy vector, It is same as copy ( Copy the memory on CPU and GPU )
const Float * data() const
returns a direct pointer to the vector
std::shared_ptr< Float > val
vector data (pointer)
void move(const view_tensor_Dense< matrix::Dense< Float >, Float > &tensor_dense, int N)
void move(const view_tensor_Dense< matrix::Dense< Float >, Float > &tensor_dense)
void fill(Float value)
fill vector elements with a scalar value
const Float * end() const
returns a end iterator
void operator=(const view1D< matrix::Dense< Float >, Float > &vec)
copy vector, It is same as copy ( Copy the memory on CPU and GPU )
vector(const std::initializer_list< Float > &list)
copy from initializer_list
bool operator==(const view1D< tensor::tensor_Dense< Float >, Float > &vec) const
Comparing vectors (v == vec)
size_t size() const
get vector size
bool operator==(const view1D< matrix::Dense< Float >, Float > &vec) const
Comparing vectors (v == vec)
bool operator!=(const view1D< tensor::tensor_Dense< Float >, Float > &vec) const
Comparing vectors (v != vec)
std::string type() const
get format name "vector"
void move(const view_tensor_Dense< vector< Float >, Float > &tensor_dense, int N)
size_t get_first() const
get first position
size_t get_offset() const
get first position (same as get_first())
Float * end()
returns a end iterator
vector(const view1D< tensor::tensor_Dense< Float >, Float > &vec)
copy from monolish::view1D from monolish::tensor::tensor_Dense
bool val_create_flag
vector create flag;
vector< Float > operator-()
Sign inversion.
vector(const size_t N)
allocate size N vector
vector(const vector< Float > &vec)
copy from monolish::vector
std::shared_ptr< Float > get_val()
get shared_ptr of val
std::size_t val_nnz
vector size
bool equal(const view1D< tensor::tensor_Dense< Float >, Float > &vec, bool compare_cpu_and_device=false) const
Comparing matrices (A == mat)
vector(const Float *start, const Float *end)
copy from pointer
size_t first
first position of data array
Float * begin()
returns a begin iterator
Float * data()
returns a direct pointer to the vector
void push_back(Float Val)
Add a new element at the end of the vector (only CPU)
void nonfree_recv()
recv data from GPU (w/o free)
vector(const size_t N, const Float min, const Float max)
create N length rand(min~max) vector
bool equal(const view1D< vector< Float >, Float > &vec, bool compare_cpu_and_device=false) const
Comparing matrices (A == mat)
void print_all(std::string filename) const
print all elements to file
~vector()
destructor of vector, free GPU memory
vector(const view1D< vector< Float >, Float > &vec)
copy from monolish::view1D from vector
bool operator==(const vector< Float > &vec) const
Comparing vectors (v == vec)
void print_all(bool force_cpu=false) const
print all elements to standart I/O
bool equal(const view1D< matrix::Dense< Float >, Float > &vec, bool compare_cpu_and_device=false) const
Comparing matrices (A == mat)
void operator=(const view1D< vector< Float >, Float > &vec)
copy vector, It is same as copy ( Copy the memory on CPU and GPU )
const Float * begin() const
returns a begin iterator
bool get_device_mem_stat() const
true: sended, false: not send
std::shared_ptr< bool > get_gpu_status() const
gpu status shared pointer
std::size_t alloc_nnz
alloced vector size
size_t get_alloc_nnz() const
get # of alloced non-zeros
void move(const view_tensor_Dense< tensor::tensor_Dense< Float >, Float > &tensor_dense)
bool equal(const vector< Float > &vec, bool compare_cpu_and_device=false) const
Comparing matrices (A == mat)
bool operator!=(const view1D< vector< Float >, Float > &vec) const
Comparing vectors (v != vec)
void device_free() const
free data on GPU
bool operator!=(const view1D< matrix::Dense< Float >, Float > &vec) const
Comparing vectors (v != vec)
std::shared_ptr< bool > gpu_status
true: sended, false: not send
vector(const size_t N, const Float value)
initialize size N vector, value to fill the container
size_t get_nnz() const
get vector size
void max(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
Create a new CRS matrix with greatest elements of two matrices (C[0:nnz] = max(A[0:nnz],...
void min(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
Create a new CRS matrix with smallest elements of two matrices (C[0:nnz] = min(A[0:nnz],...
monolish namespaces