monolish
0.14.0
MONOlithic LInear equation Solvers for Highly-parallel architecture
|
Go to the documentation of this file.
2 #include "../../../include/monolish_vml.hpp"
3 #include "../../internal/monolish_internal.hpp"
958 svadd_core(a, alpha, y);
962 svadd_core(a, alpha, y);
966 svadd_core(a, alpha, y);
970 svadd_core(a, alpha, y);
974 svadd_core(a, alpha, y);
978 svadd_core(a, alpha, y);
982 svadd_core(a, alpha, y);
986 svadd_core(a, alpha, y);
990 svadd_core(a, alpha, y);
993 svadd_core(a, alpha, y);
997 svadd_core(a, alpha, y);
1001 svadd_core(a, alpha, y);
1005 svadd_core(a, alpha, y);
1009 svadd_core(a, alpha, y);
1013 svadd_core(a, alpha, y);
1017 svadd_core(a, alpha, y);
1021 svadd_core(a, alpha, y);
1025 svadd_core(a, alpha, y);
1028 svsub_core(a, alpha, y);
1032 svsub_core(a, alpha, y);
1036 svsub_core(a, alpha, y);
1040 svsub_core(a, alpha, y);
1044 svsub_core(a, alpha, y);
1048 svsub_core(a, alpha, y);
1052 svsub_core(a, alpha, y);
1056 svsub_core(a, alpha, y);
1060 svsub_core(a, alpha, y);
1063 svsub_core(a, alpha, y);
1067 svsub_core(a, alpha, y);
1071 svsub_core(a, alpha, y);
1075 svsub_core(a, alpha, y);
1079 svsub_core(a, alpha, y);
1083 svsub_core(a, alpha, y);
1087 svsub_core(a, alpha, y);
1091 svsub_core(a, alpha, y);
1095 svsub_core(a, alpha, y);
1098 svmul_core(a, alpha, y);
1102 svmul_core(a, alpha, y);
1106 svmul_core(a, alpha, y);
1110 svmul_core(a, alpha, y);
1114 svmul_core(a, alpha, y);
1118 svmul_core(a, alpha, y);
1122 svmul_core(a, alpha, y);
1126 svmul_core(a, alpha, y);
1130 svmul_core(a, alpha, y);
1133 svmul_core(a, alpha, y);
1137 svmul_core(a, alpha, y);
1141 svmul_core(a, alpha, y);
1145 svmul_core(a, alpha, y);
1149 svmul_core(a, alpha, y);
1153 svmul_core(a, alpha, y);
1157 svmul_core(a, alpha, y);
1161 svmul_core(a, alpha, y);
1165 svmul_core(a, alpha, y);
1168 svdiv_core(a, alpha, y);
1172 svdiv_core(a, alpha, y);
1176 svdiv_core(a, alpha, y);
1180 svdiv_core(a, alpha, y);
1184 svdiv_core(a, alpha, y);
1188 svdiv_core(a, alpha, y);
1192 svdiv_core(a, alpha, y);
1196 svdiv_core(a, alpha, y);
1200 svdiv_core(a, alpha, y);
1203 svdiv_core(a, alpha, y);
1207 svdiv_core(a, alpha, y);
1211 svdiv_core(a, alpha, y);
1215 svdiv_core(a, alpha, y);
1219 svdiv_core(a, alpha, y);
1223 svdiv_core(a, alpha, y);
1227 svdiv_core(a, alpha, y);
1231 svdiv_core(a, alpha, y);
1235 svdiv_core(a, alpha, y);
1239 vvpow_core(a, b, y);
1243 vvpow_core(a, b, y);
1247 vvpow_core(a, b, y);
1251 vvpow_core(a, b, y);
1255 vvpow_core(a, b, y);
1259 vvpow_core(a, b, y);
1263 vvpow_core(a, b, y);
1268 vvpow_core(a, b, y);
1273 vvpow_core(a, b, y);
1277 vvpow_core(a, b, y);
1281 vvpow_core(a, b, y);
1285 vvpow_core(a, b, y);
1289 vvpow_core(a, b, y);
1294 vvpow_core(a, b, y);
1299 vvpow_core(a, b, y);
1303 vvpow_core(a, b, y);
1308 vvpow_core(a, b, y);
1313 vvpow_core(a, b, y);
1317 vvpow_core(a, b, y);
1321 vvpow_core(a, b, y);
1325 vvpow_core(a, b, y);
1329 vvpow_core(a, b, y);
1334 vvpow_core(a, b, y);
1339 vvpow_core(a, b, y);
1343 vvpow_core(a, b, y);
1348 vvpow_core(a, b, y);
1353 vvpow_core(a, b, y);
1356 vvpow_core(a, b, y);
1360 vvpow_core(a, b, y);
1364 vvpow_core(a, b, y);
1368 vvpow_core(a, b, y);
1372 vvpow_core(a, b, y);
1376 vvpow_core(a, b, y);
1380 vvpow_core(a, b, y);
1384 vvpow_core(a, b, y);
1388 vvpow_core(a, b, y);
1392 vvpow_core(a, b, y);
1396 vvpow_core(a, b, y);
1400 vvpow_core(a, b, y);
1404 vvpow_core(a, b, y);
1409 vvpow_core(a, b, y);
1414 vvpow_core(a, b, y);
1418 vvpow_core(a, b, y);
1423 vvpow_core(a, b, y);
1428 vvpow_core(a, b, y);
1432 vvpow_core(a, b, y);
1436 vvpow_core(a, b, y);
1440 vvpow_core(a, b, y);
1444 vvpow_core(a, b, y);
1449 vvpow_core(a, b, y);
1454 vvpow_core(a, b, y);
1458 vvpow_core(a, b, y);
1463 vvpow_core(a, b, y);
1468 vvpow_core(a, b, y);
1472 svpow_core(a, alpha, y);
1476 svpow_core(a, alpha, y);
1480 svpow_core(a, alpha, y);
1484 svpow_core(a, alpha, y);
1488 svpow_core(a, alpha, y);
1492 svpow_core(a, alpha, y);
1496 svpow_core(a, alpha, y);
1500 svpow_core(a, alpha, y);
1504 svpow_core(a, alpha, y);
1507 svpow_core(a, alpha, y);
1511 svpow_core(a, alpha, y);
1515 svpow_core(a, alpha, y);
1519 svpow_core(a, alpha, y);
1523 svpow_core(a, alpha, y);
1527 svpow_core(a, alpha, y);
1531 svpow_core(a, alpha, y);
1535 svpow_core(a, alpha, y);
1539 svpow_core(a, alpha, y);
2239 vreciprocal_core(a, y);
2242 vreciprocal_core(a, y);
2246 vreciprocal_core(a, y);
2249 vreciprocal_core(a, y);
2253 vreciprocal_core(a, y);
2257 vreciprocal_core(a, y);
2261 vreciprocal_core(a, y);
2265 vreciprocal_core(a, y);
2269 vreciprocal_core(a, y);
2272 vreciprocal_core(a, y);
2275 vreciprocal_core(a, y);
2279 vreciprocal_core(a, y);
2282 vreciprocal_core(a, y);
2286 vreciprocal_core(a, y);
2290 vreciprocal_core(a, y);
2294 vreciprocal_core(a, y);
2298 vreciprocal_core(a, y);
2302 vreciprocal_core(a, y);
2306 vvmax_core(a, b, y);
2310 vvmax_core(a, b, y);
2314 vvmax_core(a, b, y);
2318 vvmax_core(a, b, y);
2322 vvmax_core(a, b, y);
2326 vvmax_core(a, b, y);
2330 vvmax_core(a, b, y);
2335 vvmax_core(a, b, y);
2340 vvmax_core(a, b, y);
2344 vvmax_core(a, b, y);
2348 vvmax_core(a, b, y);
2352 vvmax_core(a, b, y);
2356 vvmax_core(a, b, y);
2361 vvmax_core(a, b, y);
2366 vvmax_core(a, b, y);
2370 vvmax_core(a, b, y);
2375 vvmax_core(a, b, y);
2380 vvmax_core(a, b, y);
2384 vvmax_core(a, b, y);
2388 vvmax_core(a, b, y);
2392 vvmax_core(a, b, y);
2396 vvmax_core(a, b, y);
2401 vvmax_core(a, b, y);
2406 vvmax_core(a, b, y);
2410 vvmax_core(a, b, y);
2415 vvmax_core(a, b, y);
2420 vvmax_core(a, b, y);
2423 vvmax_core(a, b, y);
2427 vvmax_core(a, b, y);
2431 vvmax_core(a, b, y);
2435 vvmax_core(a, b, y);
2439 vvmax_core(a, b, y);
2443 vvmax_core(a, b, y);
2447 vvmax_core(a, b, y);
2451 vvmax_core(a, b, y);
2455 vvmax_core(a, b, y);
2459 vvmax_core(a, b, y);
2463 vvmax_core(a, b, y);
2467 vvmax_core(a, b, y);
2471 vvmax_core(a, b, y);
2476 vvmax_core(a, b, y);
2481 vvmax_core(a, b, y);
2485 vvmax_core(a, b, y);
2490 vvmax_core(a, b, y);
2495 vvmax_core(a, b, y);
2499 vvmax_core(a, b, y);
2503 vvmax_core(a, b, y);
2507 vvmax_core(a, b, y);
2511 vvmax_core(a, b, y);
2516 vvmax_core(a, b, y);
2521 vvmax_core(a, b, y);
2525 vvmax_core(a, b, y);
2530 vvmax_core(a, b, y);
2535 vvmax_core(a, b, y);
2538 vvmin_core(a, b, y);
2542 vvmin_core(a, b, y);
2546 vvmin_core(a, b, y);
2550 vvmin_core(a, b, y);
2554 vvmin_core(a, b, y);
2558 vvmin_core(a, b, y);
2562 vvmin_core(a, b, y);
2567 vvmin_core(a, b, y);
2572 vvmin_core(a, b, y);
2576 vvmin_core(a, b, y);
2580 vvmin_core(a, b, y);
2584 vvmin_core(a, b, y);
2588 vvmin_core(a, b, y);
2593 vvmin_core(a, b, y);
2598 vvmin_core(a, b, y);
2602 vvmin_core(a, b, y);
2607 vvmin_core(a, b, y);
2612 vvmin_core(a, b, y);
2616 vvmin_core(a, b, y);
2620 vvmin_core(a, b, y);
2624 vvmin_core(a, b, y);
2628 vvmin_core(a, b, y);
2633 vvmin_core(a, b, y);
2638 vvmin_core(a, b, y);
2642 vvmin_core(a, b, y);
2647 vvmin_core(a, b, y);
2652 vvmin_core(a, b, y);
2655 vvmin_core(a, b, y);
2659 vvmin_core(a, b, y);
2663 vvmin_core(a, b, y);
2667 vvmin_core(a, b, y);
2671 vvmin_core(a, b, y);
2675 vvmin_core(a, b, y);
2679 vvmin_core(a, b, y);
2683 vvmin_core(a, b, y);
2687 vvmin_core(a, b, y);
2691 vvmin_core(a, b, y);
2695 vvmin_core(a, b, y);
2699 vvmin_core(a, b, y);
2703 vvmin_core(a, b, y);
2708 vvmin_core(a, b, y);
2713 vvmin_core(a, b, y);
2717 vvmin_core(a, b, y);
2722 vvmin_core(a, b, y);
2727 vvmin_core(a, b, y);
2731 vvmin_core(a, b, y);
2735 vvmin_core(a, b, y);
2739 vvmin_core(a, b, y);
2743 vvmin_core(a, b, y);
2748 vvmin_core(a, b, y);
2753 vvmin_core(a, b, y);
2757 vvmin_core(a, b, y);
2762 vvmin_core(a, b, y);
2767 vvmin_core(a, b, y);
2771 return vmax_core<vector<double>,
double>(y);
2774 return vmax_core<view1D<vector<double>,
double>,
double>(y);
2777 return vmax_core<view1D<matrix::Dense<double>,
double>,
double>(y);
2781 return vmax_core<view1D<vector<float>,
float>,
float>(y);
2784 return vmax_core<view1D<matrix::Dense<float>,
float>,
float>(y);
2787 return vmin_core<vector<double>,
double>(y);
2790 return vmin_core<view1D<vector<double>,
double>,
double>(y);
2793 return vmin_core<view1D<matrix::Dense<double>,
double>,
double>(y);
2797 return vmin_core<view1D<vector<float>,
float>,
float>(y);
2800 return vmin_core<view1D<matrix::Dense<float>,
float>,
float>(y);
void ceil(const matrix::CRS< double > &A, matrix::CRS< double > &C)
ceil to CRS matrix elements (C[0:nnz] = ceil(A[0:nnz]))
void min(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
Create a new CRS matrix with the smallest elements of two matrices (C[0:nnz] = min(A[0:nnz], B[0:nnz]))
void asinh(const matrix::CRS< double > &A, matrix::CRS< double > &C)
asinh to CRS matrix elements (C[0:nnz] = asinh(A[0:nnz]))
void max(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
Create a new CRS matrix with the greatest elements of two matrices (C[0:nnz] = max(A[0:nnz], B[0:nnz]))
void sub(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
element-by-element subtraction of CRS matrix A and CRS matrix B.
void sinh(const matrix::CRS< double > &A, matrix::CRS< double > &C)
sinh to CRS matrix elements (C[0:nnz] = sinh(A[0:nnz]))
void sqrt(const matrix::CRS< double > &A, matrix::CRS< double > &C)
sqrt to CRS matrix elements (C[0:nnz] = sqrt(A[0:nnz]))
void reciprocal(const matrix::CRS< double > &a, matrix::CRS< double > &y)
reciprocal to CRS matrix elements (y[0:nnz] = 1 / a[0:nnz])
void sign(const matrix::CRS< double > &A, matrix::CRS< double > &C)
sign to CRS matrix elements (C[0:nnz] = sign(A[0:nnz]))
void floor(const matrix::CRS< double > &A, matrix::CRS< double > &C)
floor to CRS matrix elements (C[0:nnz] = floor(A[0:nnz]))
void div(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
element-by-element division of CRS matrix A and CRS matrix B.
void tan(const matrix::CRS< double > &A, matrix::CRS< double > &C)
tan to CRS matrix elements (C[0:nnz] = tan(A[0:nnz]))
void add(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
element-by-element addition of CRS matrix A and CRS matrix B.
void tanh(const matrix::CRS< double > &A, matrix::CRS< double > &C)
tanh to CRS matrix elements (C[0:nnz] = tanh(A[0:nnz]))
void pow(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
power to CRS matrix elements (C[0:nnz] = pow(A[0:nnz], B[0:nnz]))
void mul(const matrix::CRS< double > &A, const matrix::CRS< double > &B, matrix::CRS< double > &C)
element-by-element multiplication of CRS matrix A and CRS matrix B.
void sin(const matrix::CRS< double > &A, matrix::CRS< double > &C)
sin to CRS matrix elements (C[0:nnz] = sin(A[0:nnz]))
void atanh(const matrix::CRS< double > &A, matrix::CRS< double > &C)
atanh to CRS matrix elements (C[0:nnz] = atanh(A[0:nnz]))
void asin(const matrix::CRS< double > &A, matrix::CRS< double > &C)
asin to CRS matrix elements (C[0:nnz] = asin(A[0:nnz]))
void atan(const matrix::CRS< double > &A, matrix::CRS< double > &C)
atan to CRS matrix elements (C[0:nnz] = atan(A[0:nnz]))