From dfcfb6d526b61f71ae36959a4113d6343f2646e9 Mon Sep 17 00:00:00 2001
From: Oliver Sander <oliver.sander@tu-dresden.de>
Date: Thu, 25 Feb 2016 21:03:56 +0100
Subject: [PATCH] Remove the 'block' array

This array was a left-over from the VariableBlockVector class.  In short,
it stores the length of each matrix row.  Of course that is redundant,
because all rows in a dense matrix have the same length.

This patch makes the class allocate less memory, and use the known row
size to compute the offsets into the data array.  In principle, the code
becomes faster by this, but I am not convinced that the effect will be
measurable.

Still, even without measurable speedup: this patch is an improvement,
because it makes the code simpler.
---
 dune/istl/matrix.hh | 266 ++++++++++++++++++--------------------------
 1 file changed, 108 insertions(+), 158 deletions(-)

diff --git a/dune/istl/matrix.hh b/dune/istl/matrix.hh
index 29cd3d002..2de082380 100644
--- a/dune/istl/matrix.hh
+++ b/dune/istl/matrix.hh
@@ -60,14 +60,6 @@ namespace MatrixImp
      */
     typedef BlockVector<B,A> block_type;
 
-    /** increment block level counter, yes, it is two levels because
-            DenseMatrixBase is a container of containers
-     */
-    enum {
-      //! The number of blocklevels this vector contains.
-      blocklevel = B::blocklevel+2
-    };
-
     // just a shorthand
     typedef BlockVectorWindow<B,A> window_type;
 
@@ -84,9 +76,8 @@ namespace MatrixImp
     DenseMatrixBase () : block_vector_unmanaged<B,A>()
     {
       // nothing is known ...
-      nblocks = 0;
+      rows_ = 0;
       columns_ = 0;
-      block = 0;
     }
 
     /** make vector with given number of blocks each having a constant size,
@@ -95,11 +86,11 @@ namespace MatrixImp
             \param _nblocks Number of blocks
             \param m Number of elements in each block
      */
-    DenseMatrixBase (size_type _nblocks, size_type m) : block_vector_unmanaged<B,A>()
+    DenseMatrixBase (size_type rows, size_type columns) : block_vector_unmanaged<B,A>()
     {
       // and we can allocate the big array in the base class
-      this->n = _nblocks*m;
-      columns_ = m;
+      this->n = rows*columns;
+      columns_ = columns;
       if (this->n>0)
       {
         this->p = allocator_.allocate(this->n);
@@ -112,22 +103,7 @@ namespace MatrixImp
       }
 
       // we can allocate the windows now
-      nblocks = _nblocks;
-      if (nblocks>0)
-      {
-        // allocate and construct the windows
-        block = windowAllocator_.allocate(nblocks);
-        new (block) window_type[nblocks];
-
-        // set the windows into the big array
-        for (size_type i=0; i<nblocks; ++i)
-          block[i].set(m,this->p+(i*m));
-      }
-      else
-      {
-        nblocks = 0;
-        block = 0;;
-      }
+      rows_ = rows;
     }
 
     //! copy constructor, has copy semantics
@@ -143,32 +119,17 @@ namespace MatrixImp
         new (this->p)B[this->n];
 
         // copy data
-        for (size_type i=0; i<this->n; i++) this->p[i]=a.p[i];
+        for (size_type i=0; i<this->n; i++)
+          this->p[i]=a.p[i];
       }
       else
       {
         this->n = 0;
-        this->p = 0;
+        this->p = nullptr;
       }
 
       // we can allocate the windows now
-      nblocks = a.nblocks;
-      if (nblocks>0)
-      {
-        // alloc
-        block = windowAllocator_.allocate(nblocks);
-        new (block) window_type[nblocks];
-
-        // and we must set the windows
-        block[0].set(a.block[0].getsize(),this->p);           // first block
-        for (size_type i=1; i<nblocks; ++i)                         // and the rest
-          block[i].set(a.block[i].getsize(),block[i-1].getptr()+block[i-1].getsize());
-      }
-      else
-      {
-        nblocks = 0;
-        block = nullptr;
-      }
+      rows_ = a.rows_;
     }
 
     //! free dynamic memory
@@ -180,17 +141,10 @@ namespace MatrixImp
           this->p[--i].~B();
         allocator_.deallocate(this->p,this->n);
       }
-      if (nblocks>0) {
-        size_type i=nblocks;
-        while (i)
-          block[--i].~window_type();
-        windowAllocator_.deallocate(block,nblocks);
-      }
-
     }
 
     //! same effect as constructor with same argument
-    void resize (size_type _nblocks, size_type m)
+    void resize (size_type rows, size_type columns)
     {
       // deconstruct objects and deallocate memory if necessary
       if (this->n>0) {
@@ -199,15 +153,9 @@ namespace MatrixImp
           this->p[--i].~B();
         allocator_.deallocate(this->p,this->n);
       }
-      if (nblocks>0) {
-        size_type i=nblocks;
-        while (i)
-          block[--i].~window_type();
-        windowAllocator_.deallocate(block,nblocks);
-      }
 
       // and we can allocate the big array in the base class
-      this->n = _nblocks*m;
+      this->n = rows*columns;
       if (this->n>0)
       {
         this->p = allocator_.allocate(this->n);
@@ -220,23 +168,8 @@ namespace MatrixImp
       }
 
       // we can allocate the windows now
-      nblocks = _nblocks;
-      columns_ = m;
-      if (nblocks>0)
-      {
-        // allocate and construct objects
-        block = windowAllocator_.allocate(nblocks);
-        new (block) window_type[nblocks];
-
-        // set the windows into the big array
-        for (size_type i=0; i<nblocks; ++i)
-          block[i].set(m,this->p+(i*m));
-      }
-      else
-      {
-        nblocks = 0;
-        block = nullptr;
-      }
+      rows_ = rows;
+      columns_ = columns;
     }
 
     //! assignment
@@ -247,7 +180,7 @@ namespace MatrixImp
         columns_ = a.columns_;
         // reallocate arrays if necessary
         // Note: still the block sizes may vary !
-        if (this->n!=a.n || nblocks!=a.nblocks)
+        if (this->n!=a.n || rows_!=a.rows_)
         {
           // deconstruct objects and deallocate memory if necessary
           if (this->n>0) {
@@ -256,12 +189,6 @@ namespace MatrixImp
               this->p[--i].~B();
             allocator_.deallocate(this->p,this->n);
           }
-          if (nblocks>0) {
-            size_type i=nblocks;
-            while (i)
-              block[--i].~window_type();
-            windowAllocator_.deallocate(block,nblocks);
-          }
 
           // allocate the big array in the base class
           this->n = a.n;
@@ -274,35 +201,16 @@ namespace MatrixImp
           else
           {
             this->n = 0;
-            this->p = 0;
+            this->p = nullptr;
           }
 
-          // we can allocate the windows now
-          nblocks = a.nblocks;
-          if (nblocks>0)
-          {
-            // alloc
-            block = windowAllocator_.allocate(nblocks);
-            new (block) window_type[nblocks];
-          }
-          else
-          {
-            nblocks = 0;
-            block = 0;;
-          }
-        }
-
-        // copy block structure, might be different although
-        // sizes are the same !
-        if (nblocks>0)
-        {
-          block[0].set(a.block[0].getsize(),this->p);                 // first block
-          for (size_type i=1; i<nblocks; ++i)                               // and the rest
-            block[i].set(a.block[i].getsize(),block[i-1].getptr()+block[i-1].getsize());
+          // Copy number of rows
+          rows_ = a.rows_;
         }
 
         // and copy the data
-        for (size_type i=0; i<this->n; i++) this->p[i]=a.p[i];
+        for (size_type i=0; i<this->n; i++)
+          this->p[i]=a.p[i];
       }
 
       return *this;
@@ -350,19 +258,46 @@ namespace MatrixImp
     public:
       //! constructor, no arguments
       Iterator ()
+      : window_(nullptr,0)
       {
-        p = 0;
+        data_ = nullptr;
         i = 0;
       }
 
+      Iterator (Iterator& other) = default;
+      Iterator (Iterator&& other) = default;
+
       //! constructor
-      Iterator (window_type* _p, size_type _i) : p(_p), i(_i)
-      {       }
+      Iterator (B* data, size_type columns, size_type _i)
+      : data_(data), i(_i),
+        window_(data + _i*columns, columns)
+      {}
+
+      /** \brief Move assignment */
+      Iterator& operator=(Iterator&& other)
+      {
+        data_ = other.data_;
+        i = other.i;
+        // Do NOT use window_.operator=, because that copies the window content, not just the window!
+        window_.set(other.window_.getsize(),other.window_.getptr());
+        return *this;
+      }
+
+      /** \brief Copy assignment */
+      Iterator& operator=(Iterator& other)
+      {
+        data_ = other.data_;
+        i = other.i;
+        // Do NOT use window_.operator=, because that copies the window content, not just the window!
+        window_.set(other.window_.getsize(),other.window_.getptr());
+        return *this;
+      }
 
       //! prefix increment
       Iterator& operator++()
       {
         ++i;
+        window_.setptr(window_.getptr()+window_.getsize());
         return *this;
       }
 
@@ -370,43 +305,44 @@ namespace MatrixImp
       Iterator& operator--()
       {
         --i;
+        window_.setptr(window_.getptr()-window_.getsize());
         return *this;
       }
 
       //! equality
       bool operator== (const Iterator& it) const
       {
-        return (p+i)==(it.p+it.i);
+        return window_.getptr() == it.window_.getptr();
       }
 
       //! inequality
       bool operator!= (const Iterator& it) const
       {
-        return (p+i)!=(it.p+it.i);
+        return window_.getptr() != it.window_.getptr();
       }
 
       //! equality
       bool operator== (const ConstIterator& it) const
       {
-        return (p+i)==(it.p+it.i);
+        return window_.getptr() == it.window_.getptr();
       }
 
       //! inequality
       bool operator!= (const ConstIterator& it) const
       {
-        return (p+i)!=(it.p+it.i);
+        return window_.getptr() != it.window_.getptr();
       }
 
       //! dereferencing
       window_type& operator* () const
       {
-        return p[i];
+        return window_;
       }
 
       //! arrow
       window_type* operator-> () const
       {
-        return p+i;
+        return &window_;
       }
 
       // return index corresponding to pointer
@@ -418,52 +354,47 @@ namespace MatrixImp
       friend class ConstIterator;
 
     private:
-      window_type* p;
+      B* data_;
       size_type i;
+      mutable window_type window_;
     };
 
     //! begin Iterator
     Iterator begin ()
     {
-      return Iterator(block,0);
+      return Iterator(this->p, columns_, 0);
     }
 
     //! end Iterator
     Iterator end ()
     {
-      return Iterator(block,nblocks);
+      return Iterator(this->p, columns_, rows_);
     }
 
     //! @returns an iterator that is positioned before
     //! the end iterator of the vector, i.e. at the last entry.
     Iterator beforeEnd ()
     {
-      return Iterator(block,nblocks-1);
+      return Iterator(this->p, columns_, rows_-1);
     }
 
     //! @returns an iterator that is positioned before
     //! the first entry of the vector.
     Iterator beforeBegin () const
     {
-      return Iterator(block,-1);
+      return Iterator(this->p, columns_, -1);
     }
 
     //! random access returning iterator (end if not contained)
     Iterator find (size_type i)
     {
-      if (i>=0 && i<nblocks)
-        return Iterator(block,i);
-      else
-        return Iterator(block,nblocks);
+      return Iterator(this->p, columns_, std::min(i,rows_));
     }
 
     //! random access returning iterator (end if not contained)
     ConstIterator find (size_type i) const
     {
-      if (i>=0 && i<nblocks)
-        return ConstIterator(block,i);
-      else
-        return ConstIterator(block,nblocks);
+      return ConstIterator(this->p, columns_, std::min(i,rows_));
     }
 
     //! ConstIterator class for sequential access
@@ -472,23 +403,47 @@ namespace MatrixImp
     public:
       //! constructor
       ConstIterator ()
+      : window_(nullptr,0)
       {
-        p = 0;
+        data_ = nullptr;
+        columns_ = 0;
         i = 0;
       }
 
       //! constructor from pointer
-      ConstIterator (const window_type* _p, size_type _i) : p(_p), i(_i)
-      {       }
+      ConstIterator (const B* data, size_type columns, size_type _i)
+      : data_(data), i(_i),
+        window_(const_cast<B*>(data + _i * columns), columns)
+      {}
 
       //! constructor from non_const iterator
-      ConstIterator (const Iterator& it) : p(it.p), i(it.i)
-      {       }
+      ConstIterator (const Iterator& it)
+      : data_(it.data_), i(it.i), window_(it.window_.getptr(),it.window_.getsize())
+      {}
+
+      ConstIterator& operator=(Iterator&& other)
+      {
+        data_ = other.data_;
+        i = other.i;
+        // Do NOT use window_.operator=, because that copies the window content, not just the window!
+        window_.set(other.window_.getsize(),other.window_.getptr());
+        return *this;
+      }
+
+      ConstIterator& operator=(Iterator& other)
+      {
+        data_ = other.data_;
+        i = other.i;
+        // Do NOT use window_.operator=, because that copies the window content, not just the window!
+        window_.set(other.window_.getsize(),other.window_.getptr());
+        return *this;
+      }
 
       //! prefix increment
       ConstIterator& operator++()
       {
         ++i;
+        window_.setptr(window_.getptr()+window_.getsize());
         return *this;
       }
 
@@ -496,43 +451,44 @@ namespace MatrixImp
       ConstIterator& operator--()
       {
         --i;
+        window_.setptr(window_.getptr()-window_.getsize());
         return *this;
       }
 
       //! equality
       bool operator== (const ConstIterator& it) const
       {
-        return (p+i)==(it.p+it.i);
+        return window_.getptr() == it.window_.getptr();
       }
 
       //! inequality
       bool operator!= (const ConstIterator& it) const
       {
-        return (p+i)!=(it.p+it.i);
+        return window_.getptr() != it.window_.getptr();
       }
 
       //! equality
       bool operator== (const Iterator& it) const
       {
-        return (p+i)==(it.p+it.i);
+        return window_.getptr() == it.window_.getptr();
       }
 
       //! inequality
       bool operator!= (const Iterator& it) const
       {
-        return (p+i)!=(it.p+it.i);
+        return window_.getptr() != it.window_.getptr();
       }
 
       //! dereferencing
       const window_type& operator* () const
       {
-        return p[i];
+        return window_;
       }
 
       //! arrow
       const window_type* operator-> () const
       {
-        return p+i;
+        return &window_;
       }
 
       // return index corresponding to pointer
@@ -544,8 +500,9 @@ namespace MatrixImp
       friend class Iterator;
 
     private:
-      const window_type* p;
+      const B* data_;
       size_type i;
+      mutable window_type window_;
     };
 
     /** \brief Export the iterator type using std naming rules */
@@ -557,46 +514,42 @@ namespace MatrixImp
     //! begin ConstIterator
     ConstIterator begin () const
     {
-      return ConstIterator(block,0);
+      return ConstIterator(this->p, columns_, 0);
     }
 
     //! end ConstIterator
     ConstIterator end () const
     {
-      return ConstIterator(block,nblocks);
+      return ConstIterator(this->p, columns_, rows_);
     }
 
     //! @returns an iterator that is positioned before
     //! the end iterator of the vector. i.e. at the last element.
     ConstIterator beforeEnd() const
     {
-      return ConstIterator(block,nblocks-1);
+      return ConstIterator(this->p, columns_, rows_-1);
     }
 
     //! end ConstIterator
     ConstIterator rend () const
     {
-      return ConstIterator(block,-1);
+      return ConstIterator(this->p, columns_, -1);
     }
 
-
     //===== sizes
 
     //! number of blocks in the vector (are of variable size here)
     size_type N () const
     {
-      return nblocks;
+      return rows_;
     }
 
 
   private:
-    size_type nblocks;            // number of blocks in vector
+    size_type rows_;            // number of matrix rows
     size_type columns_;           // number of matrix columns
-    window_type* block;     // array of blocks pointing to the array in the base class
 
     A allocator_;
-
-    typename A::template rebind<window_type>::other windowAllocator_;
   };
 
 }  // namespace MatrixImp
@@ -1130,9 +1083,6 @@ namespace MatrixImp
   protected:
 
     /** \brief Abuse DenseMatrixBase as an engine for a 2d array ISTL-style
-
-       This is almost as good as it can get.  Further speedup may be possible by using
-       the fact that all rows have the same length.
      */
     MatrixImp::DenseMatrixBase<T,A> data_;
 
-- 
GitLab