Add in a better version of 3d scheduling to the serial backend.

This is the first step to having better 3d scheduling for the serial backend. While this doesn't improve the performance, it lays the foundation for allowing I,J,K indexing when iterating Cells of a uniform grid.
2024-10-06 02:18:58 +00:00 · 2015-03-13 16:40:36 -04:00 · 2015-03-13 16:40:36 -04:00 · 18dbdd5d52
commit 18dbdd5d52
parent 73d27435f1
1 changed files with 66 additions and 8 deletions
--- a/vtkm/cont/internal/DeviceAdapterAlgorithmSerial.h
+++ b/vtkm/cont/internal/DeviceAdapterAlgorithmSerial.h
@ -255,10 +255,11 @@ public:
    DeviceAdapterAlgorithm<Device>::ScheduleKernel<Functor> kernel(functor);
-    std::for_each(
+    const vtkm::Id size = numInstances;
-          ::boost::counting_iterator<vtkm::Id>(0),
+    for(vtkm::Id i=0; i < size; ++i)
-          ::boost::counting_iterator<vtkm::Id>(numInstances),
+      {
-          kernel);
+      kernel(i);
      }
    if (errorMessage.IsErrorRaised())
    {
@ -266,12 +267,69 @@ public:
    }
  }
 private:
  // This runs in the execution environment.
  template<class FunctorType>
-  VTKM_CONT_EXPORT
+  class ScheduleKernel3D
  static void Schedule(FunctorType functor, vtkm::Id3 rangeMax)
  {
-    DeviceAdapterAlgorithm<Device>::Schedule(functor,
+  public:
-                                     rangeMax[0] * rangeMax[1] * rangeMax[2] );
+    ScheduleKernel3D(vtkm::Id3 dims,
                     const FunctorType &functor)
      : Dims(dims), Functor(functor) {  }
    //needed for when calling from schedule on a i,j,k range
    VTKM_EXEC_EXPORT void operator()(vtkm::Id3 indexIJK) const
    {
      //convert from the id3 index to flat index space, as this is a placeholder
      //algorithm while we wait for the ability to pass i,j,k indexes down
      //the scheduling pipeline
      const vtkm::Id flatIndex = indexIJK[0] +
              this->Dims[0] * ( indexIJK[1] + this->Dims[1]* indexIJK[2] );
      Functor(flatIndex);
    }
  private:
    vtkm::Id3 Dims;
    const FunctorType Functor;
  };
 public:
  template<class Functor>
  VTKM_CONT_EXPORT
  static void Schedule(Functor functor, vtkm::Id3 rangeMax)
  {
    const vtkm::Id MESSAGE_SIZE = 1024;
    char errorString[MESSAGE_SIZE];
    errorString[0] = '\0';
    vtkm::exec::internal::ErrorMessageBuffer
        errorMessage(errorString, MESSAGE_SIZE);
    functor.SetErrorMessageBuffer(errorMessage);
    DeviceAdapterAlgorithm<Device>::ScheduleKernel3D<Functor> kernel(rangeMax,
                                                                     functor);
    //use a const variable to hint to compiler this doesn't change
    const vtkm::Id3 sizes = rangeMax;
    vtkm::Id3 ijkIndex(0,0,0);
    for(vtkm::Id k=0; k < sizes[2]; ++k)
      {
      ijkIndex[2] = k;
      for(vtkm::Id j=0; j < sizes[1]; ++j)
        {
        ijkIndex[1] = j;
        for(vtkm::Id i=0; i < sizes[0]; ++i)
          {
          ijkIndex[0] = i;
          kernel( ijkIndex );
          }
        }
      }
    if (errorMessage.IsErrorRaised())
    {
      throw vtkm::cont::ErrorExecution(errorString);
    }
  }
  template<typename T, class Storage>