18#ifndef TRIPLET_FORM_HPP
19#define TRIPLET_FORM_HPP
24template<sp_d data_t, sp_i index_t>
class csc_form;
25template<sp_d data_t, sp_i index_t>
class csr_form;
33 const index_t*
const row_idx;
34 const index_t*
const col_idx;
37 csr_comparator(
const index_t*
const in_row_idx,
const index_t*
const in_col_idx)
39 , col_idx(in_col_idx) {}
41 bool operator()(
const index_t idx_a,
const index_t idx_b)
const {
42 if(row_idx[idx_a] == row_idx[idx_b])
return col_idx[idx_a] < col_idx[idx_b];
43 return row_idx[idx_a] < row_idx[idx_b];
48 const index_t*
const row_idx;
49 const index_t*
const col_idx;
52 csc_comparator(
const index_t*
const in_row_idx,
const index_t*
const in_col_idx)
54 , col_idx(in_col_idx) {}
56 bool operator()(
const index_t idx_a,
const index_t idx_b)
const {
57 if(col_idx[idx_a] == col_idx[idx_b])
return row_idx[idx_a] < row_idx[idx_b];
58 return col_idx[idx_a] < col_idx[idx_b];
63 const data_t bin = data_t(0);
65 using index_ptr = std::unique_ptr<index_t[]>;
66 using data_ptr = std::unique_ptr<data_t[]>;
68 index_ptr row_idx =
nullptr;
69 index_ptr col_idx =
nullptr;
70 data_ptr val_idx =
nullptr;
72 bool csc_sorted =
false;
73 bool csr_sorted =
false;
75 template<sp_d in_dt, sp_i in_it>
void copy_to(
const std::unique_ptr<in_it[]>& new_row_idx,
const std::unique_ptr<in_it[]>& new_col_idx,
const std::unique_ptr<in_dt[]>& new_val_idx,
const index_t
begin,
const index_t row_offset,
const index_t col_offset,
const data_t scalar)
const { copy_to(new_row_idx.get(), new_col_idx.get(), new_val_idx.get(),
begin, row_offset, col_offset, scalar); }
77 template<sp_d in_dt, sp_i in_it>
void copy_to(in_it*
const new_row_idx, in_it*
const new_col_idx, in_dt*
const new_val_idx,
const index_t
begin,
const index_t row_offset,
const index_t col_offset,
const data_t scalar)
const {
79 new_row_idx[I +
begin] = in_it(row_idx[I] + row_offset);
80 new_col_idx[I +
begin] = in_it(col_idx[I] + col_offset);
81 new_val_idx[I +
begin] = in_dt(scalar * val_idx[I]);
88 void reserve(
const index_t in_elem) {
91 access::rw(
n_alloc) = index_t(std::pow(2., std::ceil(std::log2(in_elem)) + 1));
93 index_ptr new_row_idx(
new index_t[
n_alloc]);
94 index_ptr new_col_idx(
new index_t[
n_alloc]);
95 data_ptr new_val_idx(
new data_t[
n_alloc]);
97 copy_to(new_row_idx, new_col_idx, new_val_idx, 0, 0, 0, 1);
99 row_idx = std::move(new_row_idx);
100 col_idx = std::move(new_col_idx);
101 val_idx = std::move(new_val_idx);
104 void invalidate_sorting_flag() { csc_sorted = csr_sorted =
false; }
106 void condense(
bool =
false);
108 void populate_diagonal() {
114 val_idx[
n_elem + I] = data_t(0);
116 access::rw(
n_elem) += t_elem;
117 invalidate_sorting_flag();
124 template<sp_d in_dt, sp_i in_it>
friend class csc_form;
125 template<sp_d in_dt, sp_i in_it>
friend class csr_form;
140 triplet_form(const index_t in_rows, const index_t in_cols, const index_t in_elem = index_t(0))
150 [[nodiscard]]
const index_t*
row_mem()
const {
return row_idx.get(); }
152 [[nodiscard]]
const index_t*
col_mem()
const {
return col_idx.get(); }
154 [[nodiscard]]
const data_t*
val_mem()
const {
return val_idx.get(); }
156 [[nodiscard]] index_t*
row_mem() {
return row_idx.get(); }
158 [[nodiscard]] index_t*
col_mem() {
return col_idx.get(); }
160 [[nodiscard]] data_t*
val_mem() {
return val_idx.get(); }
162 [[nodiscard]] index_t
row(
const index_t I)
const {
return row_idx[I]; }
164 [[nodiscard]] index_t
col(
const index_t I)
const {
return col_idx[I]; }
166 [[nodiscard]] data_t
val(
const index_t I)
const {
return val_idx[I]; }
174 [[nodiscard]] data_t
max()
const {
181 invalidate_sorting_flag();
184 void init(
const index_t in_elem) {
189 void init(
const index_t in_rows,
const index_t in_cols,
const index_t in_elem) {
190 access::rw(
n_rows) = in_rows;
191 access::rw(
n_cols) = in_cols;
196 for(index_t I = 0; I <
n_elem; ++I)
197 if(
row == row_idx[I] &&
col == col_idx[I])
return val_idx[I];
198 return access::rw(bin) = 0.;
201 data_t&
at(index_t, index_t);
223 access::rw(
n_elem) = in_elem;
228 void save(
const std::string&)
const;
255 void assemble(
const Mat<data_t>&,
const Col<uword>&);
258 template<sp_d in_dt, sp_i in_it>
void assemble(
const triplet_form<in_dt, in_it>& in_mat,
const std::vector<index_t>& row_shift,
const std::vector<index_t>& col_shift,
const std::vector<data_t>& scalar) {
259 suanpan_assert([&] {
if(scalar.size() != row_shift.size() || scalar.size() != col_shift.size())
throw std::invalid_argument(
"size mismatch detected"); });
261 reserve(
n_elem + index_t(scalar.size()) * index_t(in_mat.
n_elem));
263 for(
size_t I = 0; I < scalar.size(); ++I)
assemble(in_mat, row_shift[I], col_shift[I], scalar[I]);
266 Mat<data_t>
operator*(
const Col<data_t>& in_mat)
const {
267 Mat<data_t> out_mat(in_mat.n_rows, in_mat.n_cols, fill::zeros);
269 for(index_t I = 0; I <
n_elem; ++I) out_mat(row_idx[I]) += val_idx[I] * in_mat(col_idx[I]);
274 Mat<data_t>
operator*(
const Mat<data_t>& in_mat)
const {
275 Mat<data_t> out_mat(in_mat.n_rows, in_mat.n_cols, fill::zeros);
277 for(index_t I = 0; I <
n_elem; ++I) out_mat.row(row_idx[I]) += val_idx[I] * in_mat.row(col_idx[I]);
290 return copy += in_mat;
296 return copy -= in_mat;
302 [[nodiscard]] Col<data_t>
diag()
const;
313 auto last_row = row_idx[0], last_col = col_idx[0];
315 sp_i auto current_pos = index_t(0);
316 sp_d auto last_sum = data_t(0);
318 auto populate = [&] {
320 row_idx[current_pos] = last_row;
321 col_idx[current_pos] = last_col;
322 val_idx[current_pos] = last_sum;
324 last_sum = data_t(0);
327 for(index_t I = 0; I <
n_elem; ++I) {
328 if(last_row != row_idx[I] || last_col != col_idx[I]) {
330 last_row = row_idx[I];
331 last_col = col_idx[I];
333 last_sum += val_idx[I];
338 access::rw(
n_elem) = current_pos;
342 : csc_sorted{in_mat.csc_sorted}
343 , csr_sorted{in_mat.csr_sorted}
347 in_mat.copy_to(row_idx, col_idx, val_idx, 0, 0, 0, 1);
352 : row_idx{std::move(in_mat.row_idx)}
353 , col_idx{std::move(in_mat.col_idx)}
354 , val_idx{std::move(in_mat.val_idx)}
355 , csc_sorted{in_mat.csc_sorted}
356 , csr_sorted{in_mat.csr_sorted}
363 if(
this == &in_mat)
return *
this;
364 csc_sorted = in_mat.csc_sorted;
365 csr_sorted = in_mat.csr_sorted;
369 in_mat.copy_to(row_idx, col_idx, val_idx, 0, 0, 0, 1);
375 if(
this == &in_mat)
return *
this;
376 csc_sorted = in_mat.csc_sorted;
377 csr_sorted = in_mat.csr_sorted;
378 access::rw(
n_rows) = in_mat.n_rows;
379 access::rw(
n_cols) = in_mat.n_cols;
380 access::rw(
n_elem) = in_mat.n_elem;
381 access::rw(
n_alloc) = in_mat.n_alloc;
382 row_idx = std::move(in_mat.row_idx);
383 col_idx = std::move(in_mat.col_idx);
384 val_idx = std::move(in_mat.val_idx);
391 init(index_t(in_mat.n_nonzero));
393 for(
auto I = in_mat.begin(); I != in_mat.end(); ++I)
at(I.row(), I.col()) = *I;
397 : csc_sorted(in_mat.csc_sorted)
398 , csr_sorted(in_mat.csr_sorted)
408 const sp_i auto shift = index_t(base);
410 in_mat.copy_to(row_idx, col_idx, val_idx, 0, shift, shift, 1);
418 invalidate_sorting_flag();
422 return val_idx[access::rw(
n_elem)++] = data_t(0);
426 suanpan_info(
"A sparse matrix in triplet form with size of {} by {}, the density of {:.3f}%.\n",
n_rows,
n_cols,
static_cast<double>(
n_elem) /
static_cast<double>(
n_rows) /
static_cast<double>(
n_cols) * 1E2);
427 if(
n_elem > index_t(1000)) {
431 for(index_t I = 0; I <
n_elem; ++I)
432 suanpan_info(
"({}, {}) ===> {:+.8E}\n", row_idx[I], col_idx[I], val_idx[I]);
452 std::ofstream file(file_name);
453 if(!file.is_open())
return;
455 for(index_t I = 0; I <
n_elem; ++I) file <<
suanpan::format(
"{} {} {}\n", row_idx[I], col_idx[I], val_idx[I]);
473 if(csr_sorted)
return;
475 std::vector<index_t> index(
n_elem);
476 std::iota(index.begin(), index.end(), index_t(0));
480 index_ptr new_row_idx(
new index_t[
n_alloc]);
481 index_ptr new_col_idx(
new index_t[
n_alloc]);
482 data_ptr new_val_idx(
new data_t[
n_alloc]);
485 new_row_idx[I] = row_idx[index[I]];
486 new_col_idx[I] = col_idx[index[I]];
487 new_val_idx[I] = val_idx[index[I]];
490 row_idx = std::move(new_row_idx);
491 col_idx = std::move(new_col_idx);
492 val_idx = std::move(new_val_idx);
512 if(csc_sorted)
return;
514 std::vector<index_t> index(
n_elem);
515 std::iota(index.begin(), index.end(), index_t(0));
519 index_ptr new_row_idx(
new index_t[
n_alloc]);
520 index_ptr new_col_idx(
new index_t[
n_alloc]);
521 data_ptr new_val_idx(
new data_t[
n_alloc]);
524 new_row_idx[I] = row_idx[index[I]];
525 new_col_idx[I] = col_idx[index[I]];
526 new_val_idx[I] = val_idx[index[I]];
529 row_idx = std::move(new_row_idx);
530 col_idx = std::move(new_col_idx);
531 val_idx = std::move(new_val_idx);
538 if(in_mat.empty())
return;
540 invalidate_sorting_flag();
542 const auto t_elem =
n_elem + index_t(in_mat.n_elem);
547 row_idx[n_elem + I] = index_t(in_dof(I % in_dof.n_elem));
548 col_idx[n_elem + I] = index_t(in_dof(I / in_dof.n_elem));
549 val_idx[n_elem + I] = in_mat(I);
552 access::rw(
n_elem) = t_elem;
558 invalidate_sorting_flag();
564 in_mat.copy_to(row_idx, col_idx, val_idx,
n_elem, row_shift, col_shift, scalar);
566 access::rw(
n_elem) = t_elem;
577 suanpan_for_each(copy.val_idx.get(), copy.val_idx.get() + copy.n_elem, [](data_t& I) { I = -I; });
579 suanpan_for_each(copy.val_idx.get(), copy.val_idx.get() + copy.n_elem, [=](data_t& I) { I *= data_t(scalar); });
590 suanpan_for_each(copy.val_idx.get(), copy.val_idx.get() + copy.n_elem, [](data_t& I) { I = -I; });
592 suanpan_for_each(copy.val_idx.get(), copy.val_idx.get() + copy.n_elem, [=](data_t& I) { I /= data_t(scalar); });
623 invalidate_sorting_flag();
629 in_mat.copy_to(row_idx, col_idx, val_idx,
n_elem, 0, 0, 1);
631 access::rw(
n_elem) = t_elem;
639 invalidate_sorting_flag();
645 in_mat.copy_to(row_idx, col_idx, val_idx,
n_elem, 0, 0, -1);
647 access::rw(
n_elem) = t_elem;
653 Col<data_t> diag_vec(std::min(
n_rows,
n_cols), fill::zeros);
654 for(index_t I = 0; I <
n_elem; ++I)
660 auto out_mat = *
this;
662 suanpan::for_each(out_mat.n_elem, [&](
const index_t I) { out_mat.val_idx[I] *= out_mat.row(I) == out_mat.col(I); });
668 auto out_mat = *
this;
670 suanpan::for_each(out_mat.n_elem, [&](
const index_t I) { out_mat.val_idx[I] *= out_mat.row(I) < out_mat.col(I); });
676 auto out_mat = *
this;
678 suanpan::for_each(out_mat.n_elem, [&](
const index_t I) { out_mat.val_idx[I] *= out_mat.col(I) < out_mat.row(I); });
684 auto out_mat = *
this;
686 suanpan::for_each(out_mat.n_elem, [&](
const index_t I) { out_mat.val_idx[I] *= out_mat.row(I) <= out_mat.col(I); });
692 auto out_mat = *
this;
694 suanpan::for_each(out_mat.n_elem, [&](
const index_t I) { out_mat.val_idx[I] *= out_mat.col(I) <= out_mat.row(I); });
707 return std::move(mat_a);
712 return std::move(mat_b);
717 return std::move(mat_a);
Storage< T >::iterator begin(Storage< T > &S)
Definition Storage.hpp:209
Definition triplet_form.hpp:47
bool operator()(const index_t idx_a, const index_t idx_b) const
Definition triplet_form.hpp:56
csc_comparator(const index_t *const in_row_idx, const index_t *const in_col_idx)
Definition triplet_form.hpp:52
Definition triplet_form.hpp:32
bool operator()(const index_t idx_a, const index_t idx_b) const
Definition triplet_form.hpp:41
csr_comparator(const index_t *const in_row_idx, const index_t *const in_col_idx)
Definition triplet_form.hpp:37
bool approx_equal(const T x, const T y, int ulp=2)
Definition utility.h:97
std::string format(const std::string_view format_str, const T &... args)
Definition suanPan.h:302
constexpr T max_element(T start, T end)
Definition utility.h:42
void for_each(const IT start, const IT end, F &&FN)
Definition utility.h:31
#define suanpan_info
Definition suanPan.h:345
auto suanpan_assert(F &&handler)
Definition suanPan.h:339
#define suanpan_for_each
Definition suanPan.h:181
#define suanpan_sort
Definition suanPan.h:180