flexBox_CPP/flex_matrix_8h_source.html

 #ifndef flexMatrix_H
 #define flexMatrix_H

 #include "flexLinearOperator.h"

 #include <algorithm>
 #include <cmath>
 #include <cstdio>
 #include <stdexcept>
 #include <vector>

 //! Sparse matrix stored row by row: the non-zeros of row k occupy the index
 //! range [rowToIndexList[k], rowToIndexList[k + 1]) of indexList (column
 //! indices) and valueList (values).
 template<typename T>
 class flexMatrix : public flexLinearOperator<T>
 {

 #ifdef __CUDACC__
     typedef thrust::device_vector<T> Tdata;
 #else
     typedef std::vector<T> Tdata;
 #endif

 private:
     std::vector<int> rowToIndexList; // row k starts at rowToIndexList[k]; size is numRows + 1
     std::vector<int> indexList;      // column index of every stored element
     Tdata valueList;                 // value of every stored element

 public:
     //! Initializes an empty 0 x 0 matrix.
     // The initializer list follows the real initialization order (base class
     // first, then members in declaration order). rowToIndexList always holds
     // numRows + 1 entries, hence the single leading 0 here.
     flexMatrix() : flexLinearOperator<T>(0, 0, matrixOp, false), rowToIndexList(1, 0), indexList(), valueList() {}


     //! Initializes an aNumRows x aNumCols matrix without stored elements.
     //! aMinus is forwarded to the base class and read back through isMinus.
     flexMatrix(int aNumRows, int aNumCols, bool aMinus) : flexLinearOperator<T>(aNumRows, aNumCols, matrixOp, aMinus), rowToIndexList(aNumRows + 1, static_cast<int>(0)), indexList(), valueList() {}

     //! Returns a heap-allocated deep copy of this matrix.
     //! The caller owns the returned pointer and has to delete it.
     flexMatrix<T>* copy()
     {
         flexMatrix<T>* A = new flexMatrix<T>(this->getNumRows(), this->getNumCols(), this->isMinus);

         A->rowToIndexList = rowToIndexList;
         A->indexList = indexList;
         A->valueList = valueList;

         return A;
     }

     //! Applies the operator: output = A * input (A^T * input if transposed),
     //! with the sign flipped when isMinus is set.
     //! input and output must not refer to the same vector, because output is
     //! cleared before the product is accumulated.
     void times(bool transposed, const Tdata &input, Tdata &output)
     {
         // overwrite semantics: clear the target first, then reuse the accumulating kernel
         for (std::size_t i = 0; i < output.size(); ++i)
         {
             output[i] = static_cast<T>(0);
         }

         timesPlus(transposed, input, output);
     }

     //! Adds the result of applying the operator to output:
     //! output += A * input (A^T * input if transposed). If isMinus is set the
     //! product is subtracted instead.
     void timesPlus(bool transposed, const Tdata &input, Tdata &output)
     {
         if (this->isMinus)
         {
             doTimesCPU(transposed, input, output,MINUS);
         }
         else
         {
             doTimesCPU(transposed, input, output,PLUS);
         }
     }

     //! Subtracts the result of applying the operator from output:
     //! output -= A * input (A^T * input if transposed). If isMinus is set the
     //! product is added instead.
     void timesMinus(bool transposed, const Tdata &input, Tdata &output)
     {
         if (this->isMinus)
         {
             doTimesCPU(transposed, input, output,PLUS);
         }
         else
         {
             doTimesCPU(transposed, input, output,MINUS);
         }
     }


     //! Replaces the matrix content by the triplets
     //! (indexI[k], indexJ[k], indexVal[k]).
     //!
     //! Elements of one row keep the order in which they appear in the input.
     //! Previously stored elements are discarded.
     //!
     //! Throws std::invalid_argument if the three lists differ in length and
     //! std::out_of_range if a row or column index lies outside the matrix.
     //! The matrix is left unchanged when an exception is thrown.
     void blockInsert(std::vector<int> &indexI, const std::vector<int> &indexJ, const Tdata &indexVal)
     {
         const int numRows = this->getNumRows();
         const int numCols = this->getNumCols();
         const std::size_t numEntries = indexI.size();

         if (indexJ.size() != numEntries || indexVal.size() != numEntries)
         {
             throw std::invalid_argument("flexMatrix::blockInsert: index and value lists differ in length");
         }

         // pass 1: validate every entry and count the elements of each row;
         // the count of row r is stored at position r + 1 so that the prefix
         // sum below directly yields the row start offsets
         std::vector<int> rowStart(static_cast<std::size_t>(numRows) + 1, 0);

         for (std::size_t k = 0; k < numEntries; ++k)
         {
             const int row = indexI[k];
             const int col = indexJ[k];

             if (row < 0 || row >= numRows || col < 0 || col >= numCols)
             {
                 throw std::out_of_range("flexMatrix::blockInsert: element index outside of matrix");
             }

             ++rowStart[row + 1];
         }

         for (int row = 0; row < numRows; ++row)
         {
             rowStart[row + 1] += rowStart[row];
         }

         // pass 2: scatter the entries to their final position; walking the
         // input front to back keeps the input order inside every row
         std::vector<int> newIndexList(numEntries);
         std::vector<T> newValueList(numEntries);
         std::vector<int> cursor(rowStart.begin(), rowStart.end() - 1);

         for (std::size_t k = 0; k < numEntries; ++k)
         {
             const int position = cursor[indexI[k]]++;

             newIndexList[position] = indexJ[k];
             newValueList[position] = static_cast<T>(indexVal[k]);
         }

         // commit only after everything succeeded
         rowToIndexList.swap(rowStart);
         indexList.swap(newIndexList);
         valueList.assign(newValueList.begin(), newValueList.end());
     }

     /*
     //inserts new matrix element val at position [i][j]. This is SLOW!
     void insertElement(int i, int j, T val)
     {
         //get start position of next row
         int startIndexNextRow = rowToIndexList[i + 1];

         int numElt = indexList.size();

         //increment size of index and value list by 1
         indexList.push_back(0);
         valueList.push_back(static_cast<T>(0));
         //indexList.resize(indexList.size() + 1,static_cast<T>(0));
         //valueList.resize(valueList.size() + 1,static_cast<T>(0));

         //shift all elements starting with startIndexNextRow to next position
         for (int index = indexList.size()-1; index > startIndexNextRow; index--)
         {
             indexList[index] = indexList[index - 1];
             valueList[index] = valueList[index - 1];
         }

         //update indexList and valueList at current position
         indexList[startIndexNextRow] = j;
         valueList[startIndexNextRow] = val;

         //increase all elemets above i in rowToIndexList
         for (int index = i + 1; index < numRows+1; index++)
         {
             ++rowToIndexList[index];
         }
     }*/

     //! Returns the largest entry of getAbsRowSum(transposed), or 0 if that
     //! vector is empty.
     T getMaxRowSumAbs(bool transposed)
     {
         std::vector<T> rowSum = this->getAbsRowSum(transposed);

         // max_element returns end() for an empty range, which must not be dereferenced
         if (rowSum.empty())
         {
             return static_cast<T>(0);
         }

         return *std::max_element(rowSum.begin(), rowSum.end());
     }


     //! Returns the sum of absolute values of every row of the matrix, or of
     //! every column if transposed is set (i.e. the rows of A^T).
     std::vector<T> getAbsRowSum(bool transposed)
     {
         if (transposed)
         {
             // one accumulator per column, value-initialized to zero
             std::vector<T> result(this->getNumCols());

             //todo check if omp is possible
             for (int k = 0; k < this->getNumRows(); ++k)
             {
                 for (int index = rowToIndexList[k]; index < rowToIndexList[k + 1]; ++index)
                 {
                     result[indexList[index]] += std::abs(static_cast<T>(valueList[index]));
                 }
             }

             return result;
         }
         else
         {
             std::vector<T> result(this->getNumRows());

             // every iteration writes only its own result[k]
             #pragma omp parallel for
             for (int k = 0; k < this->getNumRows(); ++k)
             {
                 T tmpSum = static_cast<T>(0);
                 for (int index = rowToIndexList[k]; index < rowToIndexList[k + 1]; ++index)
                 {
                     tmpSum += std::abs(static_cast<T>(valueList[index]));
                 }


                 result[k] = tmpSum;
             }

             return result;
         }
     }


     //! Prints the stored elements of row i as "(row,column,value)|" tuples
     //! followed by a newline.
     void printRow(int i)
     {
         for (int index = rowToIndexList[i]; index < rowToIndexList[i+1]; ++index)
         {
             // %f expects a double; convert explicitly instead of relying on what T promotes to
             printf("(%d,%d,%f)|", i, indexList[index], static_cast<double>(static_cast<T>(valueList[index])));
         }

         printf("\n");
     }

     //! Prints all rows of the matrix, one line per row.
     void printMatrix()
     {
         for (int i = 0; i < this->getNumRows(); i++)
         {
             printRow(i);
         }
     }

     //DUMMY FUNCTION
     // Placeholder: ignores transposed and returns a vector of ones with one
     // entry per row; it does not compute actual row sums.
     #ifdef __CUDACC__
     thrust::device_vector<T> getAbsRowSumCUDA(bool transposed)
     {
         thrust::device_vector<T> result(this->getNumRows(), (T)1);

         return result;
     }
     #endif

     private:
     //! Accumulates the matrix-vector product into output.
     //!
     //! s == PLUS:  output += A * input (A^T * input if transposed)
     //! s == MINUS: output -= A * input (A^T * input if transposed)
     //! Any other value of s leaves output untouched.
     void doTimesCPU(bool transposed, const Tdata &input, Tdata &output,const mySign s)
     {
         if (s != PLUS && s != MINUS)
         {
             return;
         }

         // decide the sign once instead of once per stored element
         const bool subtract = (s == MINUS);
         const int numRows = this->getNumRows();

         if (transposed)
         {
             //todo: check if transposed multiplication can be parallelized
             // (different rows may write to the same output entry)
             for (int i = 0; i < numRows; ++i)
             {
                 const int indexNext = rowToIndexList[i + 1];
                 for (int index = rowToIndexList[i]; index < indexNext; ++index)
                 {
                     if (subtract)
                     {
                         output[indexList[index]] -= input[i] * valueList[index];
                     }
                     else
                     {
                         output[indexList[index]] += input[i] * valueList[index];
                     }
                 }
             }
         }
         else
         {
             // every iteration writes only its own output[i]
             #pragma omp parallel for
             for (int i = 0; i < numRows; ++i)
             {
                 T rowsum = (T)0;
                 const int indexNext = rowToIndexList[i + 1];
                 for (int index = rowToIndexList[i]; index < indexNext; ++index)
                 {
                     rowsum += input[indexList[index]] * valueList[index];
                 }

                 if (subtract)
                 {
                     output[i] -= rowsum;
                 }
                 else
                 {
                     output[i] += rowsum;
                 }
             }
         }
     }
 };

 #endif
flexMatrix::getMaxRowSumAbs
T getMaxRowSumAbs(bool transposed)
returns the maximum sum of absolute values per row used for preconditioning
Definition: flexMatrix.h:154

flexLinearOperator::getNumRows
int getNumRows() const
returns number of rows of the linear operator
Definition: flexLinearOperator.h:57

flexMatrix::getAbsRowSum
std::vector< T > getAbsRowSum(bool transposed)
returns a vector of sum of absolute values per row used for preconditioning
Definition: flexMatrix.h:162

flexLinearOperator::isMinus
bool isMinus
determines if operator is negated
Definition: flexLinearOperator.h:25

flexMatrix
represents a (non-CUDA) matrix
Definition: flexMatrix.h:10

flexMatrix::timesMinus
void timesMinus(bool transposed, const Tdata &input, Tdata &output)
applies linear operator on vector and subtracts its result from y
Definition: flexMatrix.h:64

flexMatrix::blockInsert
void blockInsert(std::vector< int > &indexI, const std::vector< int > &indexJ, const Tdata &indexVal)
inserts data into matrix
Definition: flexMatrix.h:83

flexLinearOperator::getNumCols
int getNumCols() const
returns number of columns of the linear operator
Definition: flexLinearOperator.h:48

flexMatrix::timesPlus
void timesPlus(bool transposed, const Tdata &input, Tdata &output)
applies linear operator on vector and adds its result to y
Definition: flexMatrix.h:52

flexMatrix::flexMatrix
flexMatrix()
initializes an empty matrix
Definition: flexMatrix.h:26

flexMatrix::copy
flexMatrix< T > * copy()
copies the linear operator
Definition: flexMatrix.h:36

flexMatrix::getAbsRowSumCUDA
thrust::device_vector< T > getAbsRowSumCUDA(bool transposed)
same function as getAbsRowSum() but implemented in CUDA
Definition: flexMatrix.h:225

flexMatrix::flexMatrix
flexMatrix(int aNumRows, int aNumCols, bool aMinus)
initializes a matrix
Definition: flexMatrix.h:34

mySign
mySign
enum representing the type of concatenation
Definition: tools.h:56

flexMatrix::times
void times(bool transposed, const Tdata &input, Tdata &output)
applies linear operator on vector
Definition: flexMatrix.h:47

flexLinearOperator
abstract base class for linear operators
Definition: flexLinearOperator.h:12

flexMatrix::printMatrix
void printMatrix()
prints the whole matrix
Definition: flexMatrix.h:215

flexMatrix::printRow
void printRow(int i)
prints requested row
Definition: flexMatrix.h:204