Revert "Split the code which generates vertices and indices for a single cell into a separate function."

This reverts commit 2fa291d16f.
2015-05-29 17:28:07 +02:00
parent 942bb37981
commit 96e747d0c3
1 changed files with 182 additions and 196 deletions
--- a/include/PolyVox/MarchingCubesSurfaceExtractor.inl
+++ b/include/PolyVox/MarchingCubesSurfaceExtractor.inl
@@ -49,13 +49,92 @@ namespace PolyVox
 	}

 	template< typename VolumeType, typename MeshType, typename ControllerType >
-	void generateMeshForCell(Region& region, MeshType* result, ControllerType& controller, typename VolumeType::Sampler& sampler, Array<2, Vector3DInt32>& pIndices, Array<2, Vector3DInt32>& pPreviousIndices, uint8_t iCubeIndex, uint32_t uXRegSpace, uint32_t uYRegSpace, uint32_t uZRegSpace, typename ControllerType::DensityType tThreshold)
+	void extractMarchingCubesMeshCustom(VolumeType* volData, Region region, MeshType* result, ControllerType controller)
+	{		
+		POLYVOX_THROW_IF(result == nullptr, std::invalid_argument, "Provided mesh cannot be null");
+
+		Timer timer;
+		result->clear();
+
+		typename ControllerType::DensityType tThreshold = controller.getThreshold();
+
+		const uint32_t uRegionWidthInVoxels = region.getWidthInVoxels();
+		const uint32_t uRegionHeightInVoxels = region.getHeightInVoxels();
+		const uint32_t uRegionDepthInVoxels = region.getDepthInVoxels();
+
+		// No need to clear memory because we only read from elements we have written to.
+		Array<2, Vector3DInt32> pIndices(uRegionWidthInVoxels, uRegionHeightInVoxels);
+		Array<2, Vector3DInt32> pPreviousIndices(uRegionWidthInVoxels, uRegionHeightInVoxels);
+
+		Array2DUint8 pPreviousSliceBitmask(uRegionWidthInVoxels, uRegionHeightInVoxels);
+		Array1DUint8 pPreviousRowBitmask(uRegionWidthInVoxels);
+
+		uint8_t uPreviousCell = 0;
+
+		typename VolumeType::Sampler startOfSlice(volData);
+		startOfSlice.setPosition(region.getLowerX(), region.getLowerY(), region.getLowerZ());
+
+		for (uint32_t uZRegSpace = 0; uZRegSpace < uRegionDepthInVoxels; uZRegSpace++)
+		{
+			typename VolumeType::Sampler startOfRow = startOfSlice;
+
+			for (uint32_t uYRegSpace = 0; uYRegSpace < uRegionHeightInVoxels; uYRegSpace++)
+			{
+				// Copying a sampler which is already pointing at the correct location seems (slightly) faster than
+				// calling setPosition(). Therefore we make use of 'startOfRow' and 'startOfSlice' to reset the sampler.
+				typename VolumeType::Sampler sampler = startOfRow;
+
+				for (uint32_t uXRegSpace = 0; uXRegSpace < uRegionWidthInVoxels; uXRegSpace++)
+				{
+					// Note: In many cases the provided region will be (mostly) empty which means mesh vertices/indices 
+					// are not generated and the only thing that is done for each cell is the computation of iCubeIndex.
+					// It appears that retrieving the voxel value is not so expensive and that it is the bitwise combining
+					// which actually carries the cost.
+					//
+					// If we really need to speed this up more then it may be possible to pack 4 8-bit cell indices into
+					// a single 32-bit value and then perform the bitwise logic on all four of them at the same time. 
+					// However, this complicates the code and there would still be the cost of packing/unpacking so it's
+					// not clear if there is really a benefit. It's something to consider in the future.
+
+					uint8_t iCubeIndex = 0;
+
+					// Four bits of our cube index are obtained by looking at the cube index for
+					// the previous slice and copying four of those bits into their new positions.
+					uint8_t iPreviousCubeIndexZ = pPreviousSliceBitmask(uXRegSpace, uYRegSpace);
+					iPreviousCubeIndexZ >>= 4;
+					iCubeIndex |= iPreviousCubeIndexZ;
+
+					// Two bits of our cube index are obtained by looking at the cube index for
+					// the previous row and copying two of those bits into their new positions.
+					uint8_t iPreviousCubeIndexY = pPreviousRowBitmask(uXRegSpace);
+					iPreviousCubeIndexY &= 204; //204 = 128+64+8+4
+					iPreviousCubeIndexY >>= 2;
+					iCubeIndex |= iPreviousCubeIndexY;
+
+					// One bit of our cube index is obtained by looking at the cube index for
+					// the previous cell and copying one of those bits into its new position.
+					uint8_t iPreviousCubeIndexX = uPreviousCell;
+					iPreviousCubeIndexX &= 170; //170 = 128+32+8+2
+					iPreviousCubeIndexX >>= 1;
+					iCubeIndex |= iPreviousCubeIndexX;
+
+					// The last bit of our cube index is obtained by looking
+					// at the relevant voxel and comparing it to the threshold
+					typename VolumeType::VoxelType v111 = sampler.getVoxel();
+					if (controller.convertToDensity(v111) < tThreshold) iCubeIndex |= 128;
+
+					// The current value becomes the previous value, ready for the next iteration.
+					uPreviousCell = iCubeIndex;
+					pPreviousRowBitmask(uXRegSpace) = iCubeIndex;
+					pPreviousSliceBitmask(uXRegSpace, uYRegSpace) = iCubeIndex;
+
+					/* Cube is entirely in/out of the surface */
+					uint16_t uEdge = edgeTable[iCubeIndex];
+					if (uEdge != 0)
 					{
-		auto v111 = sampler.getVoxel();
 						auto v111Density = controller.convertToDensity(v111);
 						const Vector3DFloat n000 = computeCentralDifferenceGradient(sampler, controller);

-		uint16_t uEdge = edgeTable[iCubeIndex];
 						/* Find the vertices where the surface intersects the cube */
 						if ((uEdge & 64) && (uXRegSpace > 0))
 						{
@@ -232,99 +311,6 @@ namespace PolyVox
 								}
 							} // For each triangle
 						}
-	}
-
-	template< typename VolumeType, typename MeshType, typename ControllerType >
-	void extractMarchingCubesMeshCustom(VolumeType* volData, Region region, MeshType* result, ControllerType controller)
-	{		
-		POLYVOX_THROW_IF(result == nullptr, std::invalid_argument, "Provided mesh cannot be null");
-
-		Timer timer;
-		result->clear();
-
-		typename ControllerType::DensityType tThreshold = controller.getThreshold();
-
-		const uint32_t uRegionWidthInVoxels = region.getWidthInVoxels();
-		const uint32_t uRegionHeightInVoxels = region.getHeightInVoxels();
-		const uint32_t uRegionDepthInVoxels = region.getDepthInVoxels();
-
-		// No need to clear memory because we only read from elements we have written to.
-		Array<2, Vector3DInt32> pIndices(uRegionWidthInVoxels, uRegionHeightInVoxels);
-		Array<2, Vector3DInt32> pPreviousIndices(uRegionWidthInVoxels, uRegionHeightInVoxels);
-
-		Array2DUint8 pPreviousSliceBitmask(uRegionWidthInVoxels, uRegionHeightInVoxels);
-		Array1DUint8 pPreviousRowBitmask(uRegionWidthInVoxels);
-
-		uint8_t uPreviousCell = 0;
-
-		typename VolumeType::Sampler startOfSlice(volData);
-		startOfSlice.setPosition(region.getLowerX(), region.getLowerY(), region.getLowerZ());
-
-		for (uint32_t uZRegSpace = 0; uZRegSpace < uRegionDepthInVoxels; uZRegSpace++)
-		{
-			typename VolumeType::Sampler startOfRow = startOfSlice;
-
-			for (uint32_t uYRegSpace = 0; uYRegSpace < uRegionHeightInVoxels; uYRegSpace++)
-			{
-				// Copying a sampler which is already pointing at the correct location seems (slightly) faster than
-				// calling setPosition(). Therefore we make use of 'startOfRow' and 'startOfSlice' to reset the sampler.
-				typename VolumeType::Sampler sampler = startOfRow;
-
-				for (uint32_t uXRegSpace = 0; uXRegSpace < uRegionWidthInVoxels; uXRegSpace++)
-				{
-					// Note: In many cases the provided region will be (mostly) empty which means mesh vertices/indices 
-					// are not generated and the only thing that is done for each cell is the computation of iCubeIndex.
-					// It appears that retriving the voxel value is not so expensive and that it is the bitwise combining
-					// which actually carries the cost.
-					//
-					// If we really need to speed this up more then it may be possible to pack 4 8-bit cell indices into
-					// a single 32-bit value and then perform the bitwise logic on all four of them at the same time. 
-					// However, this complicates the code and there would still be the cost of packing/unpacking so it's
-					// not clear if there is really a benefit. It's something to consider in the future.
-
-					uint8_t iCubeIndex = 0;
-
-					// Four bits of our cube index are obtained by looking at the cube index for
-					// the previous slice and copying four of those bits into their new positions.
-					uint8_t iPreviousCubeIndexZ = pPreviousSliceBitmask(uXRegSpace, uYRegSpace);
-					iPreviousCubeIndexZ >>= 4;
-					iCubeIndex |= iPreviousCubeIndexZ;
-
-					// Two bits of our cube index are obtained by looking at the cube index for
-					// the previous row and copying two of those bits into their new positions.
-					uint8_t iPreviousCubeIndexY = pPreviousRowBitmask(uXRegSpace);
-					iPreviousCubeIndexY &= 204; //204 = 128+64+8+4
-					iPreviousCubeIndexY >>= 2;
-					iCubeIndex |= iPreviousCubeIndexY;
-
-					// One bit of our cube index are obtained by looking at the cube index for
-					// the previous cell and copying one of those bits into it's new position.
-					uint8_t iPreviousCubeIndexX = uPreviousCell;
-					iPreviousCubeIndexX &= 170; //170 = 128+32+8+2
-					iPreviousCubeIndexX >>= 1;
-					iCubeIndex |= iPreviousCubeIndexX;
-
-					// The last bit of our cube index is obtained by looking
-					// at the relevant voxel and comparing it to the threshold
-					typename VolumeType::VoxelType v111 = sampler.getVoxel();
-					if (controller.convertToDensity(v111) < tThreshold) iCubeIndex |= 128;
-
-					// The current value becomes the previous value, ready for the next iteration.
-					uPreviousCell = iCubeIndex;
-					pPreviousRowBitmask(uXRegSpace) = iCubeIndex;
-					pPreviousSliceBitmask(uXRegSpace, uYRegSpace) = iCubeIndex;
-
-					/* Cube is entirely in/out of the surface */					
-					if (edgeTable[iCubeIndex] != 0)
-					{
-						// This is a rather ugly function call and appears to have some cost compared to inlining the code.
-						// As a result the case when a cell contains vertices/indices is slightly slower, but the (more common)
-						// case where a cell is empty is slightly faster, probably because the main loop is a lot more compact.
-						// Having a seperate function will also make it easier to profile in the future and see whether empty or
-						// occupied cells are really the bottleneck. The large number of parameters is messy though, so it
-						// would be nice to reduce these if we can work out how.
-						generateMeshForCell<VolumeType, MeshType, ControllerType>(region, result, controller, 
-							sampler, pIndices, pPreviousIndices, iCubeIndex, uXRegSpace, uYRegSpace, uZRegSpace, tThreshold);
 					} // For each cell
 					sampler.movePositiveX();
 				} // For X