Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Manage image centers different from (w/2,h/2) #42

Open
wants to merge 2 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions cuda_rasterizer/auxiliary.h
Original file line number Diff line number Diff line change
Expand Up @@ -146,10 +146,10 @@ __forceinline__ __device__ bool in_frustum(int idx,
float3 p_orig = { orig_points[3 * idx], orig_points[3 * idx + 1], orig_points[3 * idx + 2] };

// Bring points to screen space
float4 p_hom = transformPoint4x4(p_orig, projmatrix);
p_view = transformPoint4x3(p_orig, viewmatrix);
float4 p_hom = transformPoint4x4(p_view, projmatrix);
float p_w = 1.0f / (p_hom.w + 0.0000001f);
float3 p_proj = { p_hom.x * p_w, p_hom.y * p_w, p_hom.z * p_w };
p_view = transformPoint4x3(p_orig, viewmatrix);

if (p_view.z <= 0.2f)// || ((p_proj.x < -1.3 || p_proj.x > 1.3 || p_proj.y < -1.3 || p_proj.y > 1.3)))
{
Expand Down
44 changes: 27 additions & 17 deletions cuda_rasterizer/backward.cu
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,7 @@
#include "auxiliary.h"
#include <cooperative_groups.h>
#include <cooperative_groups/reduce.h>
#include <glm/gtc/type_ptr.hpp>
namespace cg = cooperative_groups;

// Backward pass for conversion of spherical harmonics to RGB for
Expand Down Expand Up @@ -145,9 +146,9 @@ __global__ void computeCov2DCUDA(int P,
const float3* means,
const int* radii,
const float* cov3Ds,
const float h_x, float h_y,
const float tan_fovx, float tan_fovy,
const float width, float height,
const float* view_matrix,
const float* projmatrix,
const float* dL_dconics,
float3* dL_dmeans,
float* dL_dcov)
Expand All @@ -156,6 +157,9 @@ __global__ void computeCov2DCUDA(int P,
if (idx >= P || !(radii[idx] > 0))
return;

const float h_x = projmatrix[0] * width / 2.0f;
const float h_y = projmatrix[5] * height / 2.0f;

// Reading location of 3D covariance for this Gaussian
const float* cov3D = cov3Ds + 6 * idx;

Expand All @@ -164,16 +168,19 @@ __global__ void computeCov2DCUDA(int P,
float3 mean = means[idx];
float3 dL_dconic = { dL_dconics[4 * idx], dL_dconics[4 * idx + 1], dL_dconics[4 * idx + 3] };
float3 t = transformPoint4x3(mean, view_matrix);

const float limx = 1.3f * tan_fovx;
const float limy = 1.3f * tan_fovy;

float fx = projmatrix[0], fy = projmatrix[5], cx = projmatrix[8], cy = projmatrix[9];
const float xmin = (-1.3f - cx) / fx;
const float xmax = (1.3f - cx) / fx;
const float ymin = (-1.3f - cy) / fy;
const float ymax = (1.3f - cy) / fy;
const float txtz = t.x / t.z;
const float tytz = t.y / t.z;
t.x = min(limx, max(-limx, txtz)) * t.z;
t.y = min(limy, max(-limy, tytz)) * t.z;
t.x = min(xmax, max(xmin, txtz)) * t.z;
t.y = min(ymax, max(ymin, tytz)) * t.z;

const float x_grad_mul = txtz < -limx || txtz > limx ? 0 : 1;
const float y_grad_mul = tytz < -limy || tytz > limy ? 0 : 1;
const float x_grad_mul = txtz < xmin || txtz > xmax ? 0 : 1;
const float y_grad_mul = tytz < ymin || tytz > ymax ? 0 : 1;

glm::mat3 J = glm::mat3(h_x / t.z, 0.0f, -(h_x * t.x) / (t.z * t.z),
0.0f, h_y / t.z, -(h_y * t.y) / (t.z * t.z),
Expand Down Expand Up @@ -353,7 +360,8 @@ __global__ void preprocessCUDA(
const glm::vec3* scales,
const glm::vec4* rotations,
const float scale_modifier,
const float* proj,
const float* view_matrix,
const float* proj_matrix,
const glm::vec3* campos,
const float3* dL_dmean2D,
glm::vec3* dL_dmeans,
Expand All @@ -370,9 +378,13 @@ __global__ void preprocessCUDA(
float3 m = means[idx];

// Taking care of gradients from the screenspace points
float4 m_hom = transformPoint4x4(m, proj);
float3 view_point = transformPoint4x3(m, view_matrix);
float4 m_hom = transformPoint4x4(view_point, proj_matrix);
float m_w = 1.0f / (m_hom.w + 0.0000001f);

glm::mat4x4 full_proj_matrix = glm::make_mat4(proj_matrix) * glm::make_mat4(view_matrix);
float* proj = (float*)glm::value_ptr(full_proj_matrix);

// Compute loss gradient w.r.t. 3D means due to gradients of 2D means
// from rendering procedure
glm::vec3 dL_dmean;
Expand Down Expand Up @@ -568,8 +580,7 @@ void BACKWARD::preprocess(
const float* cov3Ds,
const float* viewmatrix,
const float* projmatrix,
const float focal_x, float focal_y,
const float tan_fovx, float tan_fovy,
const float width, float height,
const glm::vec3* campos,
const float3* dL_dmean2D,
const float* dL_dconic,
Expand All @@ -589,11 +600,9 @@ void BACKWARD::preprocess(
means3D,
radii,
cov3Ds,
focal_x,
focal_y,
tan_fovx,
tan_fovy,
width, height,
viewmatrix,
projmatrix,
dL_dconic,
(float3*)dL_dmean3D,
dL_dcov3D);
Expand All @@ -610,6 +619,7 @@ void BACKWARD::preprocess(
(glm::vec3*)scales,
(glm::vec4*)rotations,
scale_modifier,
viewmatrix,
projmatrix,
campos,
(float3*)dL_dmean2D,
Expand Down
3 changes: 1 addition & 2 deletions cuda_rasterizer/backward.h
Original file line number Diff line number Diff line change
Expand Up @@ -49,8 +49,7 @@ namespace BACKWARD
const float* cov3Ds,
const float* view,
const float* proj,
const float focal_x, float focal_y,
const float tan_fovx, float tan_fovy,
const float width, float height,
const glm::vec3* campos,
const float3* dL_dmean2D,
const float* dL_dconics,
Expand Down
26 changes: 13 additions & 13 deletions cuda_rasterizer/forward.cu
Original file line number Diff line number Diff line change
Expand Up @@ -71,20 +71,23 @@ __device__ glm::vec3 computeColorFromSH(int idx, int deg, int max_coeffs, const
}

// Forward version of 2D covariance matrix computation
__device__ float3 computeCov2D(const float3& mean, float focal_x, float focal_y, float tan_fovx, float tan_fovy, const float* cov3D, const float* viewmatrix)
__device__ float3 computeCov2D(const float3& mean, float focal_x, float focal_y, const float* cov3D, const float* viewmatrix, const float* projmatrix)
{
// The following models the steps outlined by equations 29
// and 31 in "EWA Splatting" (Zwicker et al., 2002).
// Additionally considers aspect / scaling of viewport.
// Transposes used to account for row-/column-major conventions.
float3 t = transformPoint4x3(mean, viewmatrix);

const float limx = 1.3f * tan_fovx;
const float limy = 1.3f * tan_fovy;
float fx = projmatrix[0], fy = projmatrix[5], cx = projmatrix[8], cy = projmatrix[9];
const float xmin = (-1.3f - cx) / fx;
const float xmax = (1.3f - cx) / fx;
const float ymin = (-1.3f - cy) / fy;
const float ymax = (1.3f - cy) / fy;
const float txtz = t.x / t.z;
const float tytz = t.y / t.z;
t.x = min(limx, max(-limx, txtz)) * t.z;
t.y = min(limy, max(-limy, tytz)) * t.z;
t.x = min(xmax, max(xmin, txtz)) * t.z;
t.y = min(ymax, max(ymin, tytz)) * t.z;

glm::mat3 J = glm::mat3(
focal_x / t.z, 0.0f, -(focal_x * t.x) / (t.z * t.z),
Expand Down Expand Up @@ -167,8 +170,6 @@ __global__ void preprocessCUDA(int P, int D, int M,
const float* projmatrix,
const glm::vec3* cam_pos,
const int W, int H,
const float tan_fovx, float tan_fovy,
const float focal_x, float focal_y,
int* radii,
float2* points_xy_image,
float* depths,
Expand All @@ -183,6 +184,9 @@ __global__ void preprocessCUDA(int P, int D, int M,
if (idx >= P)
return;

const float focal_x = projmatrix[0] * W / 2.0f;
const float focal_y = projmatrix[5] * H / 2.0f;

// Initialize radius and touched tiles to 0. If this isn't changed,
// this Gaussian will not be processed further.
radii[idx] = 0;
Expand All @@ -195,7 +199,7 @@ __global__ void preprocessCUDA(int P, int D, int M,

// Transform point by projecting
float3 p_orig = { orig_points[3 * idx], orig_points[3 * idx + 1], orig_points[3 * idx + 2] };
float4 p_hom = transformPoint4x4(p_orig, projmatrix);
float4 p_hom = transformPoint4x4(p_view, projmatrix);
float p_w = 1.0f / (p_hom.w + 0.0000001f);
float3 p_proj = { p_hom.x * p_w, p_hom.y * p_w, p_hom.z * p_w };

Expand All @@ -213,7 +217,7 @@ __global__ void preprocessCUDA(int P, int D, int M,
}

// Compute 2D screen-space covariance matrix
float3 cov = computeCov2D(p_orig, focal_x, focal_y, tan_fovx, tan_fovy, cov3D, viewmatrix);
float3 cov = computeCov2D(p_orig, focal_x, focal_y, cov3D, viewmatrix, projmatrix);

// Invert covariance (EWA algorithm)
float det = (cov.x * cov.z - cov.y * cov.y);
Expand Down Expand Up @@ -413,8 +417,6 @@ void FORWARD::preprocess(int P, int D, int M,
const float* projmatrix,
const glm::vec3* cam_pos,
const int W, int H,
const float focal_x, float focal_y,
const float tan_fovx, float tan_fovy,
int* radii,
float2* means2D,
float* depths,
Expand All @@ -440,8 +442,6 @@ void FORWARD::preprocess(int P, int D, int M,
projmatrix,
cam_pos,
W, H,
tan_fovx, tan_fovy,
focal_x, focal_y,
radii,
means2D,
depths,
Expand Down
2 changes: 0 additions & 2 deletions cuda_rasterizer/forward.h
Original file line number Diff line number Diff line change
Expand Up @@ -35,8 +35,6 @@ namespace FORWARD
const float* projmatrix,
const glm::vec3* cam_pos,
const int W, int H,
const float focal_x, float focal_y,
const float tan_fovx, float tan_fovy,
int* radii,
float2* points_xy_image,
float* depths,
Expand Down
2 changes: 0 additions & 2 deletions cuda_rasterizer/rasterizer.h
Original file line number Diff line number Diff line change
Expand Up @@ -46,7 +46,6 @@ namespace CudaRasterizer
const float* viewmatrix,
const float* projmatrix,
const float* cam_pos,
const float tan_fovx, float tan_fovy,
const bool prefiltered,
float* out_color,
int* radii = nullptr,
Expand All @@ -66,7 +65,6 @@ namespace CudaRasterizer
const float* viewmatrix,
const float* projmatrix,
const float* campos,
const float tan_fovx, float tan_fovy,
const int* radii,
char* geom_buffer,
char* binning_buffer,
Expand Down
14 changes: 3 additions & 11 deletions cuda_rasterizer/rasterizer_impl.cu
Original file line number Diff line number Diff line change
Expand Up @@ -213,15 +213,11 @@ int CudaRasterizer::Rasterizer::forward(
const float* viewmatrix,
const float* projmatrix,
const float* cam_pos,
const float tan_fovx, float tan_fovy,
const bool prefiltered,
float* out_color,
int* radii,
bool debug)
{
const float focal_y = height / (2.0f * tan_fovy);
const float focal_x = width / (2.0f * tan_fovx);

size_t chunk_size = required<GeometryState>(P);
char* chunkptr = geometryBuffer(chunk_size);
GeometryState geomState = GeometryState::fromChunk(chunkptr, P);
Expand Down Expand Up @@ -259,8 +255,6 @@ int CudaRasterizer::Rasterizer::forward(
viewmatrix, projmatrix,
(glm::vec3*)cam_pos,
width, height,
focal_x, focal_y,
tan_fovx, tan_fovy,
radii,
geomState.means2D,
geomState.depths,
Expand Down Expand Up @@ -351,7 +345,6 @@ void CudaRasterizer::Rasterizer::backward(
const float* viewmatrix,
const float* projmatrix,
const float* campos,
const float tan_fovx, float tan_fovy,
const int* radii,
char* geom_buffer,
char* binning_buffer,
Expand All @@ -377,8 +370,8 @@ void CudaRasterizer::Rasterizer::backward(
radii = geomState.internal_radii;
}

const float focal_y = height / (2.0f * tan_fovy);
const float focal_x = width / (2.0f * tan_fovx);
const float focal_y = 0.f;
const float focal_x = 0.f;

const dim3 tile_grid((width + BLOCK_X - 1) / BLOCK_X, (height + BLOCK_Y - 1) / BLOCK_Y, 1);
const dim3 block(BLOCK_X, BLOCK_Y, 1);
Expand Down Expand Up @@ -420,8 +413,7 @@ void CudaRasterizer::Rasterizer::backward(
cov3D_ptr,
viewmatrix,
projmatrix,
focal_x, focal_y,
tan_fovx, tan_fovy,
width, height,
(glm::vec3*)campos,
(float3*)dL_dmean2D,
dL_dconic,
Expand Down
6 changes: 0 additions & 6 deletions diff_gaussian_rasterization/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -68,8 +68,6 @@ def forward(
cov3Ds_precomp,
raster_settings.viewmatrix,
raster_settings.projmatrix,
raster_settings.tanfovx,
raster_settings.tanfovy,
raster_settings.image_height,
raster_settings.image_width,
sh,
Expand Down Expand Up @@ -116,8 +114,6 @@ def backward(ctx, grad_out_color, _):
cov3Ds_precomp,
raster_settings.viewmatrix,
raster_settings.projmatrix,
raster_settings.tanfovx,
raster_settings.tanfovy,
grad_out_color,
sh,
raster_settings.sh_degree,
Expand Down Expand Up @@ -157,8 +153,6 @@ def backward(ctx, grad_out_color, _):
class GaussianRasterizationSettings(NamedTuple):
image_height: int
image_width: int
tanfovx : float
tanfovy : float
bg : torch.Tensor
scale_modifier : float
viewmatrix : torch.Tensor
Expand Down
8 changes: 0 additions & 8 deletions rasterize_points.cu
Original file line number Diff line number Diff line change
Expand Up @@ -44,8 +44,6 @@ RasterizeGaussiansCUDA(
const torch::Tensor& cov3D_precomp,
const torch::Tensor& viewmatrix,
const torch::Tensor& projmatrix,
const float tan_fovx,
const float tan_fovy,
const int image_height,
const int image_width,
const torch::Tensor& sh,
Expand Down Expand Up @@ -104,8 +102,6 @@ RasterizeGaussiansCUDA(
viewmatrix.contiguous().data<float>(),
projmatrix.contiguous().data<float>(),
campos.contiguous().data<float>(),
tan_fovx,
tan_fovy,
prefiltered,
out_color.contiguous().data<float>(),
radii.contiguous().data<int>(),
Expand All @@ -126,8 +122,6 @@ std::tuple<torch::Tensor, torch::Tensor, torch::Tensor, torch::Tensor, torch::Te
const torch::Tensor& cov3D_precomp,
const torch::Tensor& viewmatrix,
const torch::Tensor& projmatrix,
const float tan_fovx,
const float tan_fovy,
const torch::Tensor& dL_dout_color,
const torch::Tensor& sh,
const int degree,
Expand Down Expand Up @@ -173,8 +167,6 @@ std::tuple<torch::Tensor, torch::Tensor, torch::Tensor, torch::Tensor, torch::Te
viewmatrix.contiguous().data<float>(),
projmatrix.contiguous().data<float>(),
campos.contiguous().data<float>(),
tan_fovx,
tan_fovy,
radii.contiguous().data<int>(),
reinterpret_cast<char*>(geomBuffer.contiguous().data_ptr()),
reinterpret_cast<char*>(binningBuffer.contiguous().data_ptr()),
Expand Down
4 changes: 0 additions & 4 deletions rasterize_points.h
Original file line number Diff line number Diff line change
Expand Up @@ -27,8 +27,6 @@ RasterizeGaussiansCUDA(
const torch::Tensor& cov3D_precomp,
const torch::Tensor& viewmatrix,
const torch::Tensor& projmatrix,
const float tan_fovx,
const float tan_fovy,
const int image_height,
const int image_width,
const torch::Tensor& sh,
Expand All @@ -49,8 +47,6 @@ std::tuple<torch::Tensor, torch::Tensor, torch::Tensor, torch::Tensor, torch::Te
const torch::Tensor& cov3D_precomp,
const torch::Tensor& viewmatrix,
const torch::Tensor& projmatrix,
const float tan_fovx,
const float tan_fovy,
const torch::Tensor& dL_dout_color,
const torch::Tensor& sh,
const int degree,
Expand Down